diff --git "a/openvino_model.xml" "b/openvino_model.xml" new file mode 100644--- /dev/null +++ "b/openvino_model.xml" @@ -0,0 +1,113009 @@ +<?xml version="1.0"?> +<net name="Model0" version="11"> + <layers> + <layer id="3" name="input_ids" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="input_ids"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2" name="attention_mask" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="attention_mask"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1" name="position_ids" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="position_ids"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="0" name="beam_idx" type="Parameter" version="opset1"> + <data shape="?" element_type="i32" /> + <output> + <port id="0" precision="I32" names="beam_idx"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4" name="Constant_432625" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5" name="ShapeOf_432611" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6" name="Constant_432613" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7" name="Constant_432615" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8" name="Gather_432616" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9" name="Constant_432618" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10" name="Constant_432620" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11" name="Constant_432622" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="12" name="Concat_432623" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="13" name="Broadcast_432626" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="14" name="ReadValue_417408" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.9.valuepresent.9.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.9.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="15" name="Constant_401947" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="16" name="Gather_401948" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="17" name="self.model.gpt_neox.embed_in.weight" type="Const" version="opset1"> + <data element_type="u8" shape="50432, 4096" offset="28" size="206569472" /> + <output> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="18" name="Convert_448844" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="19" name="self.model.gpt_neox.embed_in.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="50432, 1" offset="206569500" size="50432" /> + <output> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="20" name="Convert_448847" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="21" name="self.model.gpt_neox.embed_in.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="22" name="self.model.gpt_neox.embed_in.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="50432, 1" offset="206619932" size="100864" /> + <output> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="23" name="self.model.gpt_neox.embed_in.weight/fq_weights_0" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="24" name="self.model.gpt_neox.embed_in.weight/fq_weights_0/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="25" name="__module.model.gpt_neox.embed_in/aten::embedding/Convert" type="Convert" version="opset1"> + <data destination_type="i32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="26" name="__module.model.gpt_neox.embed_in/aten::embedding/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="27" name="__module.model.gpt_neox.embed_in/aten::embedding/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>50432</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="306,input.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="28" name="__module.model.gpt_neox.layers.0.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="29" name="__module.model.gpt_neox.layers.0.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="30" name="Constant_325188" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="206720800" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="31" name="__module.model.gpt_neox.layers.0.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="32" name="Constant_325189" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="206737184" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="33" name="__module.model.gpt_neox.layers.0.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="315"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="34" name="self.model.gpt_neox.layers.0.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="206753568" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="35" name="Convert_448855" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="36" name="self.model.gpt_neox.layers.0.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="257085216" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="37" name="Convert_448858" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="38" name="self.model.gpt_neox.layers.0.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="39" name="self.model.gpt_neox.layers.0.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="257097504" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="40" name="self.model.gpt_neox.layers.0.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="41" name="self.model.gpt_neox.layers.0.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="42" name="__module.model.gpt_neox.layers.0.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="43" name="Constant_325190" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="257122080" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="44" name="__module.model.gpt_neox.layers.0.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="322,qkv.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="45" name="__module.model.gpt_neox.layers.0.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="46" name="__module.model.gpt_neox.layers.0.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="326,qkv.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="47" name="Constant_294370" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="48" name="Constant_294373" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="49" name="Constant_294376" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="50" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="327"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="51" name="Constant_222" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="328"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="52" name="__module.model.gpt_neox.layers.0.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="329,query.1"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="53" name="Constant_294382" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="54" name="Constant_294385" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="55" name="Constant_294388" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="56" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="336,q.1"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="57" name="self.model.gpt_neox.layers.0.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.0.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="58" name="__module.model.gpt_neox.layers.0.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="59" name="Constant_294394" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="60" name="Constant_294397" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="61" name="Constant_294400" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="62" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="330"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="63" name="ShapeOf_337904" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="64" name="Constant_340970" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="65" name="Constant_337906" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="66" name="Gather_337907" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="340"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="67" name="Constant_432638" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="68" name="Constant_432631" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="69" name="Constant_432633" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="70" name="Constant_432635" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="71" name="Concat_432636" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="72" name="Broadcast_432639" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="73" name="ReadValue_417282" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.0.keypresent.0.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.0.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="74" name="Constant_401890" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="75" name="Gather_401891" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="76" name="ShapeOf_337909" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="77" name="Constant_337910" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="78" name="Constant_337911" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="79" name="Gather_337912" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="342" /> + </output> + </layer> + <layer id="80" name="Constant_337582" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="81" name="Reshape_340905" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="82" name="__module.model.gpt_neox.layers.0.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="341,345,346,seq_len.1"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="83" name="__module.model.gpt_neox.layers.0.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="84" name="__module.model.gpt_neox.layers.0.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="349,352,cos.1"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="85" name="__module.model.gpt_neox.layers.0.attention/aten::index/Convert" type="Convert" version="opset1"> + <data destination_type="i32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="86" name="Constant_38227" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="87" name="__module.model.gpt_neox.layers.0.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="355"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="88" name="205" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64" names="205" /> + </output> + </layer> + <layer id="89" name="__module.model.gpt_neox.layers.0.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="356,cos.3"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="90" name="__module.model.gpt_neox.layers.0.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="360"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="91" name="Constant_294405" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="92" name="Constant_294404" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="93" name="__module.model.gpt_neox.layers.0.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="94" name="207" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64" names="207" /> + </output> + </layer> + <layer id="95" name="__module.model.gpt_neox.layers.0.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="96" name="__module.model.gpt_neox.layers.0.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="361,366" /> + </output> + </layer> + <layer id="97" name="Constant_57" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" names="219" /> + </output> + </layer> + <layer id="98" name="__module.model.gpt_neox.layers.0.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="99" name="__module.model.gpt_neox.layers.0.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="363,364,368,369" /> + </output> + </layer> + <layer id="100" name="Constant_337584" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="101" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="102" name="Constant_294403" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="103" name="ScatterUpdate_294406" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="104" name="Constant_294409" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="105" name="Constant_294412" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="106" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="370,x2.1"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="107" name="Constant_325191" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="108" name="__module.model.gpt_neox.layers.0.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="371"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="109" name="Constant_294457" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="110" name="Constant_294462" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="111" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="365"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="112" name="__module.model.gpt_neox.layers.0.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="373"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="113" name="self.model.gpt_neox.layers.0.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.0.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="114" name="__module.model.gpt_neox.layers.0.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="115" name="__module.model.gpt_neox.layers.0.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="116" name="__module.model.gpt_neox.layers.0.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="350,353,sin.1"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="117" name="Constant_38230" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="118" name="__module.model.gpt_neox.layers.0.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="358"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="119" name="__module.model.gpt_neox.layers.0.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="359,sin.3"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="120" name="__module.model.gpt_neox.layers.0.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="374"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="121" name="__module.model.gpt_neox.layers.0.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="375,393,403,query.3,query.5"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="122" name="Constant_236" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="331"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="123" name="__module.model.gpt_neox.layers.0.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="332,key.1"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="124" name="Constant_294508" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="125" name="Constant_294511" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="126" name="Constant_294514" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="127" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="338,k.1"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="128" name="__module.model.gpt_neox.layers.0.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="376"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="129" name="Constant_294518" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="130" name="Constant_294517" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="131" name="__module.model.gpt_neox.layers.0.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="132" name="__module.model.gpt_neox.layers.0.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="133" name="__module.model.gpt_neox.layers.0.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="377,382" /> + </output> + </layer> + <layer id="134" name="__module.model.gpt_neox.layers.0.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="135" name="__module.model.gpt_neox.layers.0.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="379,380,384,385" /> + </output> + </layer> + <layer id="136" name="Constant_337586" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="137" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="138" name="Constant_294516" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="139" name="ScatterUpdate_294519" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="140" name="Constant_294522" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="141" name="Constant_294525" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="142" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="386,x2.3"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="143" name="Constant_325192" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="144" name="__module.model.gpt_neox.layers.0.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="387"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="145" name="Constant_294570" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="146" name="Constant_294575" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="147" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="381"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="148" name="__module.model.gpt_neox.layers.0.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="389"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="149" name="__module.model.gpt_neox.layers.0.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="390"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="150" name="__module.model.gpt_neox.layers.0.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="391,395"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="151" name="__module.model.gpt_neox.layers.0.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.0.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="152" name="Constant_432651" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="153" name="Constant_432644" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="154" name="Constant_432646" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="155" name="Constant_432648" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="156" name="Concat_432649" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="157" name="Broadcast_432652" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="158" name="ReadValue_417284" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.0.valuepresent.0.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.0.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="159" name="Constant_401893" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="160" name="Gather_401894" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="161" name="Constant_294620" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="162" name="Constant_294623" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="163" name="Constant_294626" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="164" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="333"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="165" name="Constant_250" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="334"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="166" name="__module.model.gpt_neox.layers.0.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="335"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="167" name="__module.model.gpt_neox.layers.0.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.0.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="168" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="412"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="169" name="Constant_294630" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="170" name="Constant_294629" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="171" name="ShapeOf_337914" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="172" name="Constant_337915" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="173" name="Constant_337916" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="174" name="Gather_337917" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="175" name="Add_337918" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="407" /> + </output> + </layer> + <layer id="176" name="ShapeOf_337985" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="177" name="Constant_337986" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="178" name="Constant_337987" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="179" name="Gather_337988" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="405" /> + </output> + </layer> + <layer id="180" name="__module.model.gpt_neox.layers.0.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="409,410" /> + </output> + </layer> + <layer id="181" name="Constant_337588" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="182" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="183" name="Constant_294628" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="184" name="ScatterUpdate_294631" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="185" name="Constant_294632" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="186" name="Constant_337590" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="187" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="188" name="ScatterUpdate_294633" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="189" name="Constant_294636" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="190" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="413"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="191" name="Constant_294709" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="192" name="Constant_294710" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="193" name="Constant_294706" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="194" name="Constant_294705" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="195" name="ScatterUpdate_294711" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="196" name="Constant_294714" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="197" name="__module.model.gpt_neox.layers.0.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="414,415"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="198" name="__module.model.gpt_neox.layers.0.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="199" name="__module.model.gpt_neox.layers.0.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="402" /> + </output> + </layer> + <layer id="200" name="__module.model.gpt_neox.layers.0.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="416,causal_mask.1"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="201" name="Constant_325194" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="263462992" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="202" name="ShapeOf_337990" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="203" name="Constant_337991" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="204" name="Constant_337992" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="205" name="Gather_337993" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="295"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="206" name="__module.model.gpt_neox.layers.0.attention/prim::ListConstruct/Reshape_0_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="263462996" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="207" name="__module.model.gpt_neox/prim::ListConstruct/Concat" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="296"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="208" name="__module.model.gpt_neox/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="297,298,attention_mask.3"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="209" name="Constant_337592" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="263463004" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="210" name="__module.model.gpt_neox/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="300,301,attention_mask.5"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="211" name="__module.model.gpt_neox/aten::to/Convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="302"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="212" name="Constant_325193" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="263462992" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="213" name="__module.model.gpt_neox/aten::rsub/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="214" name="__module.model.gpt_neox/aten::rsub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="303"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="215" name="Constant_325195" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="216" name="__module.model.gpt_neox/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="304,attention_mask"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="217" name="Add_314988" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="218" name="ShapeOf_314989" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="219" name="Constant_337996" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="220" name="Constant_337997" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="221" name="Gather_337998" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="400"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="222" name="Constant_267961" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="223" name="Constant_267963" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="224" name="Constant_267965" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="225" name="__module.model.gpt_neox.layers.0.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="417"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="226" name="Maximum_314990" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="227" name="__module.model.gpt_neox.layers.0.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="419"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="228" name="__module.model.gpt_neox.layers.0.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="420,421,sdpa_result.1,tensor.1"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="229" name="Constant_691" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="422"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="230" name="__module.model.gpt_neox.layers.0.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="423"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="231" name="__module.model.gpt_neox.layers.0.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="232" name="__module.model.gpt_neox.layers.0.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="428"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="233" name="self.model.gpt_neox.layers.0.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="263463044" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="234" name="Convert_448866" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="235" name="self.model.gpt_neox.layers.0.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="280240260" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="236" name="Convert_448869" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="237" name="self.model.gpt_neox.layers.0.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="238" name="self.model.gpt_neox.layers.0.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="280244356" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="239" name="self.model.gpt_neox.layers.0.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="240" name="self.model.gpt_neox.layers.0.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="241" name="__module.model.gpt_neox.layers.0.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="242" name="Constant_325196" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="280252548" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="243" name="__module.model.gpt_neox.layers.0.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="431,433,input.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="244" name="__module.model.gpt_neox.layers.0/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="437,attn_output.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="245" name="__module.model.gpt_neox.layers.0.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="246" name="__module.model.gpt_neox.layers.0.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="247" name="Constant_325197" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="280268932" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="248" name="__module.model.gpt_neox.layers.0.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="249" name="Constant_325198" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="280285316" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="250" name="__module.model.gpt_neox.layers.0.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="441"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="251" name="self.model.gpt_neox.layers.0.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="280301700" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="252" name="Convert_448877" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="253" name="self.model.gpt_neox.layers.0.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="347410564" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="254" name="Convert_448880" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="255" name="self.model.gpt_neox.layers.0.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="256" name="self.model.gpt_neox.layers.0.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="347426948" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="257" name="self.model.gpt_neox.layers.0.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="258" name="self.model.gpt_neox.layers.0.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="259" name="__module.model.gpt_neox.layers.0.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="260" name="Constant_325199" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="347459716" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="261" name="__module.model.gpt_neox.layers.0.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="446"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="262" name="__module.model.gpt_neox.layers.0.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="447"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="263" name="self.model.gpt_neox.layers.0.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="347525252" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="264" name="Convert_448888" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="265" name="self.model.gpt_neox.layers.0.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="414634116" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="266" name="Convert_448891" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="267" name="self.model.gpt_neox.layers.0.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="268" name="self.model.gpt_neox.layers.0.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="414638212" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="269" name="self.model.gpt_neox.layers.0.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="270" name="self.model.gpt_neox.layers.0.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="271" name="__module.model.gpt_neox.layers.0.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="272" name="Constant_325200" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="414646404" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="273" name="__module.model.gpt_neox.layers.0.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="450,input.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="274" name="__module.model.gpt_neox.layers.0/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="452,454,hidden_states.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="275" name="__module.model.gpt_neox.layers.1.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="276" name="__module.model.gpt_neox.layers.1.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="277" name="Constant_325201" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="414662788" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="278" name="__module.model.gpt_neox.layers.1.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="279" name="Constant_325202" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="414679172" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="280" name="__module.model.gpt_neox.layers.1.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="464"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="281" name="self.model.gpt_neox.layers.1.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="414695556" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="282" name="Convert_448899" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="283" name="self.model.gpt_neox.layers.1.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="465027204" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="284" name="Convert_448902" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="285" name="self.model.gpt_neox.layers.1.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="286" name="self.model.gpt_neox.layers.1.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="465039492" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="287" name="self.model.gpt_neox.layers.1.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="288" name="self.model.gpt_neox.layers.1.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="289" name="__module.model.gpt_neox.layers.1.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="290" name="Constant_325203" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="465064068" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="291" name="__module.model.gpt_neox.layers.1.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="471,qkv.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="292" name="__module.model.gpt_neox.layers.1.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="293" name="__module.model.gpt_neox.layers.1.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="475,qkv.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="294" name="Constant_294734" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="295" name="Constant_294737" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="296" name="Constant_294740" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="297" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="476"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="298" name="Constant_803" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="477"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="299" name="__module.model.gpt_neox.layers.1.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="478,query.7"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="300" name="Constant_294746" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="301" name="Constant_294749" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="302" name="Constant_294752" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="303" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="485,q.3"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="304" name="self.model.gpt_neox.layers.1.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.1.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="305" name="__module.model.gpt_neox.layers.1.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="306" name="Constant_294758" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="307" name="Constant_294761" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="308" name="Constant_294764" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="309" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="479"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="310" name="ShapeOf_338000" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="311" name="Constant_340973" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="312" name="Constant_338002" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="313" name="Gather_338003" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="489"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="314" name="Constant_432664" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="315" name="Constant_432657" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="316" name="Constant_432659" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="317" name="Constant_432661" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="318" name="Concat_432662" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="319" name="Broadcast_432665" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="320" name="ReadValue_417286" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.1.keypresent.1.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.1.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="321" name="Constant_401896" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="322" name="Gather_401897" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="323" name="ShapeOf_338005" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="324" name="Constant_338006" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="325" name="Constant_338007" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="326" name="Gather_338008" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="491" /> + </output> + </layer> + <layer id="327" name="Constant_337594" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="328" name="Reshape_340907" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="329" name="__module.model.gpt_neox.layers.1.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="490,494,495,seq_len.5"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="330" name="__module.model.gpt_neox.layers.1.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="331" name="__module.model.gpt_neox.layers.1.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="498,501,cos.5"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="332" name="Constant_38233" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="333" name="__module.model.gpt_neox.layers.1.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="504"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="334" name="__module.model.gpt_neox.layers.1.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="505,cos.7"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="335" name="__module.model.gpt_neox.layers.1.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="509"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="336" name="Constant_294769" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="337" name="Constant_294768" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="338" name="__module.model.gpt_neox.layers.1.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="339" name="__module.model.gpt_neox.layers.1.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="340" name="__module.model.gpt_neox.layers.1.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="510,515" /> + </output> + </layer> + <layer id="341" name="__module.model.gpt_neox.layers.1.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="342" name="__module.model.gpt_neox.layers.1.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="512,513,517,518" /> + </output> + </layer> + <layer id="343" name="Constant_337596" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="344" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="345" name="Constant_294767" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="346" name="ScatterUpdate_294770" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="347" name="Constant_294773" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="348" name="Constant_294776" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="349" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="519,x2.5"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="350" name="Constant_325204" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="351" name="__module.model.gpt_neox.layers.1.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="520"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="352" name="Constant_294821" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="353" name="Constant_294826" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="354" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="514"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="355" name="__module.model.gpt_neox.layers.1.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="522"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="356" name="self.model.gpt_neox.layers.1.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.1.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="357" name="__module.model.gpt_neox.layers.1.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="358" name="__module.model.gpt_neox.layers.1.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="359" name="__module.model.gpt_neox.layers.1.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="499,502,sin.5"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="360" name="Constant_38236" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="361" name="__module.model.gpt_neox.layers.1.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="507"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="362" name="__module.model.gpt_neox.layers.1.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="508,sin.7"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="363" name="__module.model.gpt_neox.layers.1.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="523"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="364" name="__module.model.gpt_neox.layers.1.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="524,542,552,query.11,query.9"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="365" name="Constant_817" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="480"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="366" name="__module.model.gpt_neox.layers.1.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="481,key.7"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="367" name="Constant_294872" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="368" name="Constant_294875" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="369" name="Constant_294878" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="370" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="487,k.3"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="371" name="__module.model.gpt_neox.layers.1.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="525"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="372" name="Constant_294882" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="373" name="Constant_294881" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="374" name="__module.model.gpt_neox.layers.1.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="375" name="__module.model.gpt_neox.layers.1.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="376" name="__module.model.gpt_neox.layers.1.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="526,531" /> + </output> + </layer> + <layer id="377" name="__module.model.gpt_neox.layers.1.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="378" name="__module.model.gpt_neox.layers.1.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="528,529,533,534" /> + </output> + </layer> + <layer id="379" name="Constant_337598" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="380" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="381" name="Constant_294880" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="382" name="ScatterUpdate_294883" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="383" name="Constant_294886" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="384" name="Constant_294889" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="385" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="535,x2.7"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="386" name="Constant_325205" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="387" name="__module.model.gpt_neox.layers.1.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="536"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="388" name="Constant_294934" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="389" name="Constant_294939" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="390" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="530"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="391" name="__module.model.gpt_neox.layers.1.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="538"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="392" name="__module.model.gpt_neox.layers.1.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="539"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="393" name="__module.model.gpt_neox.layers.1.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="540,544"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="394" name="__module.model.gpt_neox.layers.1.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.1.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="395" name="Constant_432677" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="396" name="Constant_432670" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="397" name="Constant_432672" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="398" name="Constant_432674" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="399" name="Concat_432675" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="400" name="Broadcast_432678" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="401" name="ReadValue_417288" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.1.valuepresent.1.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.1.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="402" name="Constant_401899" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="403" name="Gather_401900" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="404" name="Constant_294984" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="405" name="Constant_294987" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="406" name="Constant_294990" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="407" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="482"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="408" name="Constant_831" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="483"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="409" name="__module.model.gpt_neox.layers.1.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="484"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="410" name="__module.model.gpt_neox.layers.1.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.1.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="411" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="561"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="412" name="Constant_294994" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="413" name="Constant_294993" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="414" name="ShapeOf_338010" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="415" name="Constant_338011" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="416" name="Constant_338012" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="417" name="Gather_338013" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="418" name="Add_338014" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="556" /> + </output> + </layer> + <layer id="419" name="ShapeOf_338081" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="420" name="Constant_338082" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="421" name="Constant_338083" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="422" name="Gather_338084" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="554" /> + </output> + </layer> + <layer id="423" name="__module.model.gpt_neox.layers.1.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="558,559" /> + </output> + </layer> + <layer id="424" name="Constant_337600" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="425" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="426" name="Constant_294992" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="427" name="ScatterUpdate_294995" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="428" name="Constant_294996" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="429" name="Constant_337602" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="430" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="431" name="ScatterUpdate_294997" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="432" name="Constant_295000" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="433" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="562"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="434" name="Constant_295073" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="435" name="Constant_295074" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="436" name="Constant_295070" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="437" name="Constant_295069" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="438" name="ScatterUpdate_295075" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="439" name="Constant_295078" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="440" name="__module.model.gpt_neox.layers.1.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="563,564"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="441" name="__module.model.gpt_neox.layers.1.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="442" name="__module.model.gpt_neox.layers.1.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="551" /> + </output> + </layer> + <layer id="443" name="__module.model.gpt_neox.layers.1.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="565,causal_mask.5"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="444" name="Add_315060" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="445" name="ShapeOf_315061" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="446" name="Constant_338087" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="447" name="Constant_338088" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="448" name="Gather_338089" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="549"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="449" name="Constant_267971" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="450" name="Constant_267973" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="451" name="Constant_267975" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="452" name="__module.model.gpt_neox.layers.1.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="566"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="453" name="Maximum_315062" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="454" name="__module.model.gpt_neox.layers.1.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="568"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="455" name="__module.model.gpt_neox.layers.1.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="569,570,sdpa_result.3,tensor.5"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="456" name="Constant_1272" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="571"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="457" name="__module.model.gpt_neox.layers.1.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="572"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="458" name="__module.model.gpt_neox.layers.1.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="459" name="__module.model.gpt_neox.layers.1.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="577"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="460" name="self.model.gpt_neox.layers.1.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="465113220" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="461" name="Convert_448910" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="462" name="self.model.gpt_neox.layers.1.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="481890436" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="463" name="Convert_448913" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="464" name="self.model.gpt_neox.layers.1.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="465" name="self.model.gpt_neox.layers.1.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="481894532" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="466" name="self.model.gpt_neox.layers.1.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="467" name="self.model.gpt_neox.layers.1.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="468" name="__module.model.gpt_neox.layers.1.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="469" name="Constant_325206" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="481902724" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="470" name="__module.model.gpt_neox.layers.1.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="580,582,input.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="471" name="__module.model.gpt_neox.layers.1/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="586,attn_output.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="472" name="__module.model.gpt_neox.layers.1.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="473" name="__module.model.gpt_neox.layers.1.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="474" name="Constant_325207" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="481919108" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="475" name="__module.model.gpt_neox.layers.1.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="476" name="Constant_325208" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="481935492" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="477" name="__module.model.gpt_neox.layers.1.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="590"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="478" name="self.model.gpt_neox.layers.1.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="481951876" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="479" name="Convert_448921" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="480" name="self.model.gpt_neox.layers.1.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="549060740" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="481" name="Convert_448924" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="482" name="self.model.gpt_neox.layers.1.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="483" name="self.model.gpt_neox.layers.1.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="549077124" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="484" name="self.model.gpt_neox.layers.1.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="485" name="self.model.gpt_neox.layers.1.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="486" name="__module.model.gpt_neox.layers.1.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="487" name="Constant_325209" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="549109892" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="488" name="__module.model.gpt_neox.layers.1.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="595"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="489" name="__module.model.gpt_neox.layers.1.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="596"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="490" name="self.model.gpt_neox.layers.1.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="549175428" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="491" name="Convert_448932" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="492" name="self.model.gpt_neox.layers.1.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="616284292" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="493" name="Convert_448935" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="494" name="self.model.gpt_neox.layers.1.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="495" name="self.model.gpt_neox.layers.1.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="616288388" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="496" name="self.model.gpt_neox.layers.1.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="497" name="self.model.gpt_neox.layers.1.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="498" name="__module.model.gpt_neox.layers.1.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="499" name="Constant_325210" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="616296580" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="500" name="__module.model.gpt_neox.layers.1.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="599,input.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="501" name="__module.model.gpt_neox.layers.1/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="601,603,hidden_states.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="502" name="__module.model.gpt_neox.layers.2.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="503" name="__module.model.gpt_neox.layers.2.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="504" name="Constant_325211" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="616312964" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="505" name="__module.model.gpt_neox.layers.2.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="506" name="Constant_325212" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="616329348" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="507" name="__module.model.gpt_neox.layers.2.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="613"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="508" name="self.model.gpt_neox.layers.2.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="616345732" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="509" name="Convert_448943" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="510" name="self.model.gpt_neox.layers.2.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="666677380" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="511" name="Convert_448946" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="512" name="self.model.gpt_neox.layers.2.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="513" name="self.model.gpt_neox.layers.2.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="666689668" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="514" name="self.model.gpt_neox.layers.2.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="515" name="self.model.gpt_neox.layers.2.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="516" name="__module.model.gpt_neox.layers.2.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="517" name="Constant_325213" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="666714244" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="518" name="__module.model.gpt_neox.layers.2.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="620,qkv.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="519" name="__module.model.gpt_neox.layers.2.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="520" name="__module.model.gpt_neox.layers.2.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="624,qkv.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="521" name="Constant_295085" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="522" name="Constant_295088" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="523" name="Constant_295091" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="524" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="625"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="525" name="Constant_1384" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="626"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="526" name="__module.model.gpt_neox.layers.2.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="627,query.13"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="527" name="Constant_295097" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="528" name="Constant_295100" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="529" name="Constant_295103" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="530" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="634,q.5"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="531" name="self.model.gpt_neox.layers.2.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.2.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="532" name="__module.model.gpt_neox.layers.2.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="533" name="Constant_295109" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="534" name="Constant_295112" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="535" name="Constant_295115" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="536" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="628"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="537" name="ShapeOf_338091" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="538" name="Constant_340976" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="539" name="Constant_338093" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="540" name="Gather_338094" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="638"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="541" name="Constant_432690" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="542" name="Constant_432683" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="543" name="Constant_432685" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="544" name="Constant_432687" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="545" name="Concat_432688" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="546" name="Broadcast_432691" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="547" name="ReadValue_417330" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.2.keypresent.2.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.2.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="548" name="Constant_401902" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="549" name="Gather_401903" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="550" name="ShapeOf_338096" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="551" name="Constant_338097" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="552" name="Constant_338098" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="553" name="Gather_338099" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="640" /> + </output> + </layer> + <layer id="554" name="Constant_337604" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="555" name="Reshape_340909" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="556" name="__module.model.gpt_neox.layers.2.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="639,643,644,seq_len.9"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="557" name="__module.model.gpt_neox.layers.2.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="558" name="__module.model.gpt_neox.layers.2.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="647,650,cos.9"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="559" name="Constant_38239" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="560" name="__module.model.gpt_neox.layers.2.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="653"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="561" name="__module.model.gpt_neox.layers.2.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="654,cos.11"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="562" name="__module.model.gpt_neox.layers.2.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="658"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="563" name="Constant_295120" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="564" name="Constant_295119" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="565" name="__module.model.gpt_neox.layers.2.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="566" name="__module.model.gpt_neox.layers.2.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="567" name="__module.model.gpt_neox.layers.2.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="659,664" /> + </output> + </layer> + <layer id="568" name="__module.model.gpt_neox.layers.2.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="569" name="__module.model.gpt_neox.layers.2.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="661,662,666,667" /> + </output> + </layer> + <layer id="570" name="Constant_337606" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="571" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="572" name="Constant_295118" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="573" name="ScatterUpdate_295121" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="574" name="Constant_295124" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="575" name="Constant_295127" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="576" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="668,x2.9"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="577" name="Constant_325214" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="578" name="__module.model.gpt_neox.layers.2.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="669"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="579" name="Constant_295172" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="580" name="Constant_295177" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="581" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="663"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="582" name="__module.model.gpt_neox.layers.2.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="671"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="583" name="self.model.gpt_neox.layers.2.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.2.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="584" name="__module.model.gpt_neox.layers.2.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="585" name="__module.model.gpt_neox.layers.2.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="586" name="__module.model.gpt_neox.layers.2.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="648,651,sin.9"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="587" name="Constant_38242" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="588" name="__module.model.gpt_neox.layers.2.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="656"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="589" name="__module.model.gpt_neox.layers.2.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="657,sin.11"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="590" name="__module.model.gpt_neox.layers.2.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="672"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="591" name="__module.model.gpt_neox.layers.2.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="673,691,701,query.15,query.17"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="592" name="Constant_1398" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="629"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="593" name="__module.model.gpt_neox.layers.2.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="630,key.13"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="594" name="Constant_295223" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="595" name="Constant_295226" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="596" name="Constant_295229" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="597" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="636,k.5"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="598" name="__module.model.gpt_neox.layers.2.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="674"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="599" name="Constant_295233" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="600" name="Constant_295232" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="601" name="__module.model.gpt_neox.layers.2.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="602" name="__module.model.gpt_neox.layers.2.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="603" name="__module.model.gpt_neox.layers.2.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="675,680" /> + </output> + </layer> + <layer id="604" name="__module.model.gpt_neox.layers.2.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="605" name="__module.model.gpt_neox.layers.2.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="677,678,682,683" /> + </output> + </layer> + <layer id="606" name="Constant_337608" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="607" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="608" name="Constant_295231" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="609" name="ScatterUpdate_295234" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="610" name="Constant_295237" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="611" name="Constant_295240" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="612" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="684,x2.11"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="613" name="Constant_325215" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="614" name="__module.model.gpt_neox.layers.2.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="685"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="615" name="Constant_295285" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="616" name="Constant_295290" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="617" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="679"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="618" name="__module.model.gpt_neox.layers.2.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="687"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="619" name="__module.model.gpt_neox.layers.2.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="688"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="620" name="__module.model.gpt_neox.layers.2.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="689,693"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="621" name="__module.model.gpt_neox.layers.2.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.2.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="622" name="Constant_432703" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="623" name="Constant_432696" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="624" name="Constant_432698" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="625" name="Constant_432700" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="626" name="Concat_432701" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="627" name="Broadcast_432704" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="628" name="ReadValue_417332" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.2.valuepresent.2.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.2.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="629" name="Constant_401905" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="630" name="Gather_401906" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="631" name="Constant_295335" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="632" name="Constant_295338" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="633" name="Constant_295341" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="634" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="631"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="635" name="Constant_1412" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="632"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="636" name="__module.model.gpt_neox.layers.2.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="633"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="637" name="__module.model.gpt_neox.layers.2.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.2.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="638" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="710"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="639" name="Constant_295345" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="640" name="Constant_295344" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="641" name="ShapeOf_338101" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="642" name="Constant_338102" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="643" name="Constant_338103" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="644" name="Gather_338104" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="645" name="Add_338105" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="705" /> + </output> + </layer> + <layer id="646" name="ShapeOf_338172" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="647" name="Constant_338173" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="648" name="Constant_338174" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="649" name="Gather_338175" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="703" /> + </output> + </layer> + <layer id="650" name="__module.model.gpt_neox.layers.2.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="707,708" /> + </output> + </layer> + <layer id="651" name="Constant_337610" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="652" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="653" name="Constant_295343" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="654" name="ScatterUpdate_295346" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="655" name="Constant_295347" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="656" name="Constant_337612" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="657" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="658" name="ScatterUpdate_295348" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="659" name="Constant_295351" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="660" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="711"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="661" name="Constant_295424" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="662" name="Constant_295425" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="663" name="Constant_295421" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="664" name="Constant_295420" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="665" name="ScatterUpdate_295426" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="666" name="Constant_295429" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="667" name="__module.model.gpt_neox.layers.2.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="712,713"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="668" name="__module.model.gpt_neox.layers.2.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="669" name="__module.model.gpt_neox.layers.2.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="700" /> + </output> + </layer> + <layer id="670" name="__module.model.gpt_neox.layers.2.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="714,causal_mask.9"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="671" name="Add_315132" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="672" name="ShapeOf_315133" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="673" name="Constant_338178" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="674" name="Constant_338179" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="675" name="Gather_338180" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="698"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="676" name="Constant_267981" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="677" name="Constant_267983" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="678" name="Constant_267985" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="679" name="__module.model.gpt_neox.layers.2.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="715"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="680" name="Maximum_315134" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="681" name="__module.model.gpt_neox.layers.2.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="717"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="682" name="__module.model.gpt_neox.layers.2.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="718,719,sdpa_result.5,tensor.9"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="683" name="Constant_1853" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="720"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="684" name="__module.model.gpt_neox.layers.2.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="721"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="685" name="__module.model.gpt_neox.layers.2.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="686" name="__module.model.gpt_neox.layers.2.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="726"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="687" name="self.model.gpt_neox.layers.2.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="666763396" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="688" name="Convert_448954" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="689" name="self.model.gpt_neox.layers.2.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="683540612" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="690" name="Convert_448957" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="691" name="self.model.gpt_neox.layers.2.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="692" name="self.model.gpt_neox.layers.2.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="683544708" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="693" name="self.model.gpt_neox.layers.2.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="694" name="self.model.gpt_neox.layers.2.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="695" name="__module.model.gpt_neox.layers.2.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="696" name="Constant_325216" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="683552900" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="697" name="__module.model.gpt_neox.layers.2.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="729,731,input.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="698" name="__module.model.gpt_neox.layers.2/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="735,attn_output.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="699" name="__module.model.gpt_neox.layers.2.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="700" name="__module.model.gpt_neox.layers.2.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="701" name="Constant_325217" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="683569284" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="702" name="__module.model.gpt_neox.layers.2.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="703" name="Constant_325218" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="683585668" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="704" name="__module.model.gpt_neox.layers.2.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="739"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="705" name="self.model.gpt_neox.layers.2.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="683602052" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="706" name="Convert_448965" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="707" name="self.model.gpt_neox.layers.2.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="750710916" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="708" name="Convert_448968" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="709" name="self.model.gpt_neox.layers.2.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="710" name="self.model.gpt_neox.layers.2.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="750727300" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="711" name="self.model.gpt_neox.layers.2.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="712" name="self.model.gpt_neox.layers.2.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="713" name="__module.model.gpt_neox.layers.2.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="714" name="Constant_325219" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="750760068" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="715" name="__module.model.gpt_neox.layers.2.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="744"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="716" name="__module.model.gpt_neox.layers.2.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="745"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="717" name="self.model.gpt_neox.layers.2.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="750825604" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="718" name="Convert_448976" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="719" name="self.model.gpt_neox.layers.2.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="817934468" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="720" name="Convert_448979" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="721" name="self.model.gpt_neox.layers.2.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="722" name="self.model.gpt_neox.layers.2.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="817938564" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="723" name="self.model.gpt_neox.layers.2.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="724" name="self.model.gpt_neox.layers.2.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="725" name="__module.model.gpt_neox.layers.2.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="726" name="Constant_325220" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="817946756" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="727" name="__module.model.gpt_neox.layers.2.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="748,input.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="728" name="__module.model.gpt_neox.layers.2/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="750,752,hidden_states.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="729" name="__module.model.gpt_neox.layers.3.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="730" name="__module.model.gpt_neox.layers.3.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="731" name="Constant_325221" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="817963140" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="732" name="__module.model.gpt_neox.layers.3.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="733" name="Constant_325222" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="817979524" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="734" name="__module.model.gpt_neox.layers.3.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="762"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="735" name="self.model.gpt_neox.layers.3.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="817995908" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="736" name="Convert_448987" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="737" name="self.model.gpt_neox.layers.3.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="868327556" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="738" name="Convert_448990" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="739" name="self.model.gpt_neox.layers.3.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="740" name="self.model.gpt_neox.layers.3.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="868339844" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="741" name="self.model.gpt_neox.layers.3.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="742" name="self.model.gpt_neox.layers.3.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="743" name="__module.model.gpt_neox.layers.3.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="744" name="Constant_325223" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="868364420" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="745" name="__module.model.gpt_neox.layers.3.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="769,qkv.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="746" name="__module.model.gpt_neox.layers.3.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="747" name="__module.model.gpt_neox.layers.3.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="773,qkv.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="748" name="Constant_295436" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="749" name="Constant_295439" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="750" name="Constant_295442" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="751" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="774"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="752" name="Constant_1965" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="775"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="753" name="__module.model.gpt_neox.layers.3.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="776,query.19"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="754" name="Constant_295448" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="755" name="Constant_295451" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="756" name="Constant_295454" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="757" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="783,q.7"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="758" name="self.model.gpt_neox.layers.3.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.3.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="759" name="__module.model.gpt_neox.layers.3.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="760" name="Constant_295460" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="761" name="Constant_295463" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="762" name="Constant_295466" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="763" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="777"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="764" name="ShapeOf_338182" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="765" name="Constant_340979" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="766" name="Constant_338184" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="767" name="Gather_338185" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="787"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="768" name="Constant_432716" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="769" name="Constant_432709" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="770" name="Constant_432711" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="771" name="Constant_432713" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="772" name="Concat_432714" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="773" name="Broadcast_432717" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="774" name="ReadValue_417374" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.3.keypresent.3.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.3.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="775" name="Constant_401908" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="776" name="Gather_401909" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="777" name="ShapeOf_338187" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="778" name="Constant_338188" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="779" name="Constant_338189" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="780" name="Gather_338190" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="789" /> + </output> + </layer> + <layer id="781" name="Constant_337614" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="782" name="Reshape_340911" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="783" name="__module.model.gpt_neox.layers.3.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="788,792,793,seq_len.13"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="784" name="__module.model.gpt_neox.layers.3.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="785" name="__module.model.gpt_neox.layers.3.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="796,799,cos.13"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="786" name="Constant_38245" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="787" name="__module.model.gpt_neox.layers.3.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="802"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="788" name="__module.model.gpt_neox.layers.3.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="803,cos.15"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="789" name="__module.model.gpt_neox.layers.3.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="807"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="790" name="Constant_295471" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="791" name="Constant_295470" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="792" name="__module.model.gpt_neox.layers.3.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="793" name="__module.model.gpt_neox.layers.3.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="794" name="__module.model.gpt_neox.layers.3.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="808,813" /> + </output> + </layer> + <layer id="795" name="__module.model.gpt_neox.layers.3.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="796" name="__module.model.gpt_neox.layers.3.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="810,811,815,816" /> + </output> + </layer> + <layer id="797" name="Constant_337616" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="798" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="799" name="Constant_295469" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="800" name="ScatterUpdate_295472" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="801" name="Constant_295475" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="802" name="Constant_295478" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="803" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="817,x2.13"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="804" name="Constant_325224" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="805" name="__module.model.gpt_neox.layers.3.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="818"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="806" name="Constant_295523" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="807" name="Constant_295528" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="808" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="812"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="809" name="__module.model.gpt_neox.layers.3.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="820"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="810" name="self.model.gpt_neox.layers.3.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.3.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="811" name="__module.model.gpt_neox.layers.3.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="812" name="__module.model.gpt_neox.layers.3.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="813" name="__module.model.gpt_neox.layers.3.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="797,800,sin.13"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="814" name="Constant_38248" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="815" name="__module.model.gpt_neox.layers.3.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="805"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="816" name="__module.model.gpt_neox.layers.3.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="806,sin.15"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="817" name="__module.model.gpt_neox.layers.3.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="821"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="818" name="__module.model.gpt_neox.layers.3.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="822,840,850,query.21,query.23"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="819" name="Constant_1979" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="778"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="820" name="__module.model.gpt_neox.layers.3.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="779,key.19"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="821" name="Constant_295574" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="822" name="Constant_295577" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="823" name="Constant_295580" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="824" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="785,k.7"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="825" name="__module.model.gpt_neox.layers.3.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="823"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="826" name="Constant_295584" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="827" name="Constant_295583" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="828" name="__module.model.gpt_neox.layers.3.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="829" name="__module.model.gpt_neox.layers.3.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="830" name="__module.model.gpt_neox.layers.3.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="824,829" /> + </output> + </layer> + <layer id="831" name="__module.model.gpt_neox.layers.3.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="832" name="__module.model.gpt_neox.layers.3.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="826,827,831,832" /> + </output> + </layer> + <layer id="833" name="Constant_337618" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="834" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="835" name="Constant_295582" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="836" name="ScatterUpdate_295585" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="837" name="Constant_295588" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="838" name="Constant_295591" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="839" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="833,x2.15"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="840" name="Constant_325225" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="841" name="__module.model.gpt_neox.layers.3.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="834"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="842" name="Constant_295636" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="843" name="Constant_295641" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="844" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="828"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="845" name="__module.model.gpt_neox.layers.3.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="836"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="846" name="__module.model.gpt_neox.layers.3.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="837"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="847" name="__module.model.gpt_neox.layers.3.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="838,842"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="848" name="__module.model.gpt_neox.layers.3.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.3.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="849" name="Constant_432729" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="850" name="Constant_432722" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="851" name="Constant_432724" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="852" name="Constant_432726" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="853" name="Concat_432727" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="854" name="Broadcast_432730" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="855" name="ReadValue_417376" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.3.valuepresent.3.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.3.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="856" name="Constant_401911" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="857" name="Gather_401912" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="858" name="Constant_295686" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="859" name="Constant_295689" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="860" name="Constant_295692" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="861" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="780"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="862" name="Constant_1993" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="781"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="863" name="__module.model.gpt_neox.layers.3.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="782"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="864" name="__module.model.gpt_neox.layers.3.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.3.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="865" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="859"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="866" name="Constant_295696" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="867" name="Constant_295695" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="868" name="ShapeOf_338192" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="869" name="Constant_338193" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="870" name="Constant_338194" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="871" name="Gather_338195" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="872" name="Add_338196" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="854" /> + </output> + </layer> + <layer id="873" name="ShapeOf_338263" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="874" name="Constant_338264" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="875" name="Constant_338265" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="876" name="Gather_338266" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="852" /> + </output> + </layer> + <layer id="877" name="__module.model.gpt_neox.layers.3.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="856,857" /> + </output> + </layer> + <layer id="878" name="Constant_337620" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="879" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="880" name="Constant_295694" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="881" name="ScatterUpdate_295697" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="882" name="Constant_295698" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="883" name="Constant_337622" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="884" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="885" name="ScatterUpdate_295699" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="886" name="Constant_295702" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="887" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="860"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="888" name="Constant_295775" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="889" name="Constant_295776" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="890" name="Constant_295772" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="891" name="Constant_295771" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="892" name="ScatterUpdate_295777" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="893" name="Constant_295780" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="894" name="__module.model.gpt_neox.layers.3.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="861,862"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="895" name="__module.model.gpt_neox.layers.3.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="896" name="__module.model.gpt_neox.layers.3.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="849" /> + </output> + </layer> + <layer id="897" name="__module.model.gpt_neox.layers.3.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="863,causal_mask.13"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="898" name="Add_315204" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="899" name="ShapeOf_315205" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="900" name="Constant_338269" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="901" name="Constant_338270" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="902" name="Gather_338271" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="847"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="903" name="Constant_267991" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="904" name="Constant_267993" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="905" name="Constant_267995" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="906" name="__module.model.gpt_neox.layers.3.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="864"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="907" name="Maximum_315206" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="908" name="__module.model.gpt_neox.layers.3.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="866"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="909" name="__module.model.gpt_neox.layers.3.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="867,868,sdpa_result.7,tensor.13"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="910" name="Constant_2434" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="869"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="911" name="__module.model.gpt_neox.layers.3.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="870"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="912" name="__module.model.gpt_neox.layers.3.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="913" name="__module.model.gpt_neox.layers.3.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="875"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="914" name="self.model.gpt_neox.layers.3.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="868413572" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="915" name="Convert_448998" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="916" name="self.model.gpt_neox.layers.3.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="885190788" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="917" name="Convert_449001" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="918" name="self.model.gpt_neox.layers.3.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="919" name="self.model.gpt_neox.layers.3.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="885194884" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="920" name="self.model.gpt_neox.layers.3.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="921" name="self.model.gpt_neox.layers.3.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="922" name="__module.model.gpt_neox.layers.3.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="923" name="Constant_325226" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="885203076" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="924" name="__module.model.gpt_neox.layers.3.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="878,880,input.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="925" name="__module.model.gpt_neox.layers.3/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="884,attn_output.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="926" name="__module.model.gpt_neox.layers.3.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="927" name="__module.model.gpt_neox.layers.3.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="928" name="Constant_325227" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="885219460" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="929" name="__module.model.gpt_neox.layers.3.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="930" name="Constant_325228" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="885235844" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="931" name="__module.model.gpt_neox.layers.3.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="888"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="932" name="self.model.gpt_neox.layers.3.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="885252228" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="933" name="Convert_449009" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="934" name="self.model.gpt_neox.layers.3.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="952361092" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="935" name="Convert_449012" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="936" name="self.model.gpt_neox.layers.3.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="937" name="self.model.gpt_neox.layers.3.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="952377476" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="938" name="self.model.gpt_neox.layers.3.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="939" name="self.model.gpt_neox.layers.3.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="940" name="__module.model.gpt_neox.layers.3.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="941" name="Constant_325229" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="952410244" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="942" name="__module.model.gpt_neox.layers.3.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="893"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="943" name="__module.model.gpt_neox.layers.3.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="894"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="944" name="self.model.gpt_neox.layers.3.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="952475780" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="945" name="Convert_449020" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="946" name="self.model.gpt_neox.layers.3.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1019584644" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="947" name="Convert_449023" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="948" name="self.model.gpt_neox.layers.3.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="949" name="self.model.gpt_neox.layers.3.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1019588740" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="950" name="self.model.gpt_neox.layers.3.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="951" name="self.model.gpt_neox.layers.3.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="952" name="__module.model.gpt_neox.layers.3.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="953" name="Constant_325230" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1019596932" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="954" name="__module.model.gpt_neox.layers.3.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="897,input.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="955" name="__module.model.gpt_neox.layers.3/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="899,901,hidden_states.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="956" name="__module.model.gpt_neox.layers.4.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="957" name="__module.model.gpt_neox.layers.4.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="958" name="Constant_325231" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1019613316" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="959" name="__module.model.gpt_neox.layers.4.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="960" name="Constant_325232" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1019629700" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="961" name="__module.model.gpt_neox.layers.4.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="911"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="962" name="self.model.gpt_neox.layers.4.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="1019646084" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="963" name="Convert_449031" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="964" name="self.model.gpt_neox.layers.4.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="1069977732" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="965" name="Convert_449034" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="966" name="self.model.gpt_neox.layers.4.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="967" name="self.model.gpt_neox.layers.4.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="1069990020" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="968" name="self.model.gpt_neox.layers.4.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="969" name="self.model.gpt_neox.layers.4.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="970" name="__module.model.gpt_neox.layers.4.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="971" name="Constant_325233" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="1070014596" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="972" name="__module.model.gpt_neox.layers.4.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="918,qkv.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="973" name="__module.model.gpt_neox.layers.4.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="974" name="__module.model.gpt_neox.layers.4.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="922,qkv.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="975" name="Constant_295787" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="976" name="Constant_295790" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="977" name="Constant_295793" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="978" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="923"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="979" name="Constant_2546" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="924"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="980" name="__module.model.gpt_neox.layers.4.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="925,query.25"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="981" name="Constant_295799" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="982" name="Constant_295802" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="983" name="Constant_295805" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="984" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="932,q.9"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="985" name="self.model.gpt_neox.layers.4.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.4.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="986" name="__module.model.gpt_neox.layers.4.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="987" name="Constant_295811" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="988" name="Constant_295814" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="989" name="Constant_295817" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="990" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="926"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="991" name="ShapeOf_338273" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="992" name="Constant_340982" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="993" name="Constant_338275" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="994" name="Gather_338276" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="936"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="995" name="Constant_432742" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="996" name="Constant_432735" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="997" name="Constant_432737" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="998" name="Constant_432739" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="999" name="Concat_432740" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1000" name="Broadcast_432743" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1001" name="ReadValue_417386" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.4.keypresent.4.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.4.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1002" name="Constant_401914" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1003" name="Gather_401915" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1004" name="ShapeOf_338278" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1005" name="Constant_338279" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1006" name="Constant_338280" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1007" name="Gather_338281" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="938" /> + </output> + </layer> + <layer id="1008" name="Constant_337624" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1009" name="Reshape_340913" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1010" name="__module.model.gpt_neox.layers.4.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="937,941,942,seq_len.17"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1011" name="__module.model.gpt_neox.layers.4.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1012" name="__module.model.gpt_neox.layers.4.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="945,948,cos.17"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1013" name="Constant_38251" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1014" name="__module.model.gpt_neox.layers.4.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="951"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1015" name="__module.model.gpt_neox.layers.4.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="952,cos.19"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1016" name="__module.model.gpt_neox.layers.4.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="956"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1017" name="Constant_295822" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1018" name="Constant_295821" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1019" name="__module.model.gpt_neox.layers.4.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1020" name="__module.model.gpt_neox.layers.4.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1021" name="__module.model.gpt_neox.layers.4.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="957,962" /> + </output> + </layer> + <layer id="1022" name="__module.model.gpt_neox.layers.4.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1023" name="__module.model.gpt_neox.layers.4.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="959,960,964,965" /> + </output> + </layer> + <layer id="1024" name="Constant_337626" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1025" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1026" name="Constant_295820" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1027" name="ScatterUpdate_295823" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1028" name="Constant_295826" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1029" name="Constant_295829" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1030" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="966,x2.17"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1031" name="Constant_325234" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1032" name="__module.model.gpt_neox.layers.4.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="967"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1033" name="Constant_295874" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1034" name="Constant_295879" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1035" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="961"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1036" name="__module.model.gpt_neox.layers.4.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="969"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1037" name="self.model.gpt_neox.layers.4.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.4.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1038" name="__module.model.gpt_neox.layers.4.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1039" name="__module.model.gpt_neox.layers.4.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1040" name="__module.model.gpt_neox.layers.4.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="946,949,sin.17"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1041" name="Constant_38254" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1042" name="__module.model.gpt_neox.layers.4.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="954"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1043" name="__module.model.gpt_neox.layers.4.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="955,sin.19"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1044" name="__module.model.gpt_neox.layers.4.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="970"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1045" name="__module.model.gpt_neox.layers.4.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="971,989,999,query.27,query.29"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1046" name="Constant_2560" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="927"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1047" name="__module.model.gpt_neox.layers.4.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="928,key.25"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1048" name="Constant_295925" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1049" name="Constant_295928" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1050" name="Constant_295931" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1051" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="934,k.9"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1052" name="__module.model.gpt_neox.layers.4.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="972"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1053" name="Constant_295935" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1054" name="Constant_295934" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1055" name="__module.model.gpt_neox.layers.4.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1056" name="__module.model.gpt_neox.layers.4.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1057" name="__module.model.gpt_neox.layers.4.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="973,978" /> + </output> + </layer> + <layer id="1058" name="__module.model.gpt_neox.layers.4.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1059" name="__module.model.gpt_neox.layers.4.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="975,976,980,981" /> + </output> + </layer> + <layer id="1060" name="Constant_337628" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1061" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1062" name="Constant_295933" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1063" name="ScatterUpdate_295936" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1064" name="Constant_295939" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1065" name="Constant_295942" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1066" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="982,x2.19"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1067" name="Constant_325235" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1068" name="__module.model.gpt_neox.layers.4.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="983"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1069" name="Constant_295987" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1070" name="Constant_295992" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1071" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="977"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1072" name="__module.model.gpt_neox.layers.4.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="985"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1073" name="__module.model.gpt_neox.layers.4.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="986"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1074" name="__module.model.gpt_neox.layers.4.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="987,991"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1075" name="__module.model.gpt_neox.layers.4.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.4.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1076" name="Constant_432755" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1077" name="Constant_432748" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1078" name="Constant_432750" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1079" name="Constant_432752" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1080" name="Concat_432753" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1081" name="Broadcast_432756" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1082" name="ReadValue_417388" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.4.valuepresent.4.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.4.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1083" name="Constant_401917" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1084" name="Gather_401918" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1085" name="Constant_296037" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1086" name="Constant_296040" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1087" name="Constant_296043" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1088" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="929"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1089" name="Constant_2574" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="930"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1090" name="__module.model.gpt_neox.layers.4.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="931"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1091" name="__module.model.gpt_neox.layers.4.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.4.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1092" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="1008"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1093" name="Constant_296047" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1094" name="Constant_296046" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1095" name="ShapeOf_338283" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1096" name="Constant_338284" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1097" name="Constant_338285" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1098" name="Gather_338286" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="1099" name="Add_338287" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1003" /> + </output> + </layer> + <layer id="1100" name="ShapeOf_338354" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1101" name="Constant_338355" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1102" name="Constant_338356" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1103" name="Gather_338357" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1001" /> + </output> + </layer> + <layer id="1104" name="__module.model.gpt_neox.layers.4.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1005,1006" /> + </output> + </layer> + <layer id="1105" name="Constant_337630" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1106" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1107" name="Constant_296045" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1108" name="ScatterUpdate_296048" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1109" name="Constant_296049" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1110" name="Constant_337632" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1111" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1112" name="ScatterUpdate_296050" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1113" name="Constant_296053" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1114" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1009"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1115" name="Constant_296126" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1116" name="Constant_296127" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1117" name="Constant_296123" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1118" name="Constant_296122" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1119" name="ScatterUpdate_296128" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1120" name="Constant_296131" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1121" name="__module.model.gpt_neox.layers.4.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1010,1011"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1122" name="__module.model.gpt_neox.layers.4.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1123" name="__module.model.gpt_neox.layers.4.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="998" /> + </output> + </layer> + <layer id="1124" name="__module.model.gpt_neox.layers.4.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="1012,causal_mask.17"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1125" name="Add_315276" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1126" name="ShapeOf_315277" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1127" name="Constant_338360" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1128" name="Constant_338361" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1129" name="Gather_338362" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="996"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1130" name="Constant_268001" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1131" name="Constant_268003" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1132" name="Constant_268005" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1133" name="__module.model.gpt_neox.layers.4.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1013"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1134" name="Maximum_315278" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1135" name="__module.model.gpt_neox.layers.4.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1015"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1136" name="__module.model.gpt_neox.layers.4.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1016,1017,sdpa_result.9,tensor.17"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1137" name="Constant_3015" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1018"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1138" name="__module.model.gpt_neox.layers.4.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1019"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1139" name="__module.model.gpt_neox.layers.4.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1140" name="__module.model.gpt_neox.layers.4.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1024"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1141" name="self.model.gpt_neox.layers.4.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="1070063748" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1142" name="Convert_449042" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1143" name="self.model.gpt_neox.layers.4.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1086840964" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1144" name="Convert_449045" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1145" name="self.model.gpt_neox.layers.4.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1146" name="self.model.gpt_neox.layers.4.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1086845060" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1147" name="self.model.gpt_neox.layers.4.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1148" name="self.model.gpt_neox.layers.4.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1149" name="__module.model.gpt_neox.layers.4.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1150" name="Constant_325236" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1086853252" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1151" name="__module.model.gpt_neox.layers.4.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1027,1029,input.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1152" name="__module.model.gpt_neox.layers.4/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1033,attn_output.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1153" name="__module.model.gpt_neox.layers.4.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1154" name="__module.model.gpt_neox.layers.4.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1155" name="Constant_325237" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1086869636" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1156" name="__module.model.gpt_neox.layers.4.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1157" name="Constant_325238" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1086886020" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1158" name="__module.model.gpt_neox.layers.4.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1037"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1159" name="self.model.gpt_neox.layers.4.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="1086902404" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1160" name="Convert_449053" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1161" name="self.model.gpt_neox.layers.4.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="1154011268" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1162" name="Convert_449056" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1163" name="self.model.gpt_neox.layers.4.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1164" name="self.model.gpt_neox.layers.4.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="1154027652" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1165" name="self.model.gpt_neox.layers.4.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1166" name="self.model.gpt_neox.layers.4.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1167" name="__module.model.gpt_neox.layers.4.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1168" name="Constant_325239" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="1154060420" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1169" name="__module.model.gpt_neox.layers.4.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1042"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1170" name="__module.model.gpt_neox.layers.4.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1043"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1171" name="self.model.gpt_neox.layers.4.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="1154125956" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1172" name="Convert_449064" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1173" name="self.model.gpt_neox.layers.4.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1221234820" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1174" name="Convert_449067" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1175" name="self.model.gpt_neox.layers.4.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1176" name="self.model.gpt_neox.layers.4.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1221238916" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1177" name="self.model.gpt_neox.layers.4.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1178" name="self.model.gpt_neox.layers.4.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1179" name="__module.model.gpt_neox.layers.4.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1180" name="Constant_325240" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1221247108" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1181" name="__module.model.gpt_neox.layers.4.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1046,input.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1182" name="__module.model.gpt_neox.layers.4/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1048,1050,hidden_states.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1183" name="__module.model.gpt_neox.layers.5.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1184" name="__module.model.gpt_neox.layers.5.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1185" name="Constant_325241" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1221263492" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1186" name="__module.model.gpt_neox.layers.5.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1187" name="Constant_325242" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1221279876" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1188" name="__module.model.gpt_neox.layers.5.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1060"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1189" name="self.model.gpt_neox.layers.5.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="1221296260" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1190" name="Convert_449075" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1191" name="self.model.gpt_neox.layers.5.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="1271627908" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1192" name="Convert_449078" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1193" name="self.model.gpt_neox.layers.5.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1194" name="self.model.gpt_neox.layers.5.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="1271640196" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1195" name="self.model.gpt_neox.layers.5.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1196" name="self.model.gpt_neox.layers.5.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1197" name="__module.model.gpt_neox.layers.5.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1198" name="Constant_325243" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="1271664772" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1199" name="__module.model.gpt_neox.layers.5.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1067,qkv.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1200" name="__module.model.gpt_neox.layers.5.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1201" name="__module.model.gpt_neox.layers.5.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1071,qkv.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="1202" name="Constant_296138" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1203" name="Constant_296141" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1204" name="Constant_296144" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1205" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1072"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1206" name="Constant_3127" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1073"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1207" name="__module.model.gpt_neox.layers.5.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1074,query.31"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1208" name="Constant_296150" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1209" name="Constant_296153" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1210" name="Constant_296156" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1211" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1081,q.11"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1212" name="self.model.gpt_neox.layers.5.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.5.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1213" name="__module.model.gpt_neox.layers.5.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1214" name="Constant_296162" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1215" name="Constant_296165" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1216" name="Constant_296168" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1217" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1075"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1218" name="ShapeOf_338364" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1219" name="Constant_340985" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1220" name="Constant_338366" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1221" name="Gather_338367" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1085"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1222" name="Constant_432768" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1223" name="Constant_432761" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1224" name="Constant_432763" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1225" name="Constant_432765" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1226" name="Concat_432766" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1227" name="Broadcast_432769" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1228" name="ReadValue_417390" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.5.keypresent.5.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.5.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1229" name="Constant_401920" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1230" name="Gather_401921" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1231" name="ShapeOf_338369" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1232" name="Constant_338370" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1233" name="Constant_338371" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1234" name="Gather_338372" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1087" /> + </output> + </layer> + <layer id="1235" name="Constant_337634" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1236" name="Reshape_340915" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1237" name="__module.model.gpt_neox.layers.5.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1086,1090,1091,seq_len.21"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1238" name="__module.model.gpt_neox.layers.5.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1239" name="__module.model.gpt_neox.layers.5.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1094,1097,cos.21"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1240" name="Constant_38257" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1241" name="__module.model.gpt_neox.layers.5.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1100"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1242" name="__module.model.gpt_neox.layers.5.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1101,cos.23"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1243" name="__module.model.gpt_neox.layers.5.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1105"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1244" name="Constant_296173" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1245" name="Constant_296172" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1246" name="__module.model.gpt_neox.layers.5.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1247" name="__module.model.gpt_neox.layers.5.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1248" name="__module.model.gpt_neox.layers.5.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1106,1111" /> + </output> + </layer> + <layer id="1249" name="__module.model.gpt_neox.layers.5.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1250" name="__module.model.gpt_neox.layers.5.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1108,1109,1113,1114" /> + </output> + </layer> + <layer id="1251" name="Constant_337636" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1252" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1253" name="Constant_296171" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1254" name="ScatterUpdate_296174" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1255" name="Constant_296177" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1256" name="Constant_296180" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1257" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1115,x2.21"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1258" name="Constant_325244" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1259" name="__module.model.gpt_neox.layers.5.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1116"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1260" name="Constant_296225" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1261" name="Constant_296230" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1262" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1110"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1263" name="__module.model.gpt_neox.layers.5.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1118"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1264" name="self.model.gpt_neox.layers.5.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.5.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1265" name="__module.model.gpt_neox.layers.5.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1266" name="__module.model.gpt_neox.layers.5.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1267" name="__module.model.gpt_neox.layers.5.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1095,1098,sin.21"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1268" name="Constant_38260" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1269" name="__module.model.gpt_neox.layers.5.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1270" name="__module.model.gpt_neox.layers.5.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1104,sin.23"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1271" name="__module.model.gpt_neox.layers.5.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1119"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1272" name="__module.model.gpt_neox.layers.5.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1120,1138,1148,query.33,query.35"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1273" name="Constant_3141" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1076"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1274" name="__module.model.gpt_neox.layers.5.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1077,key.31"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1275" name="Constant_296276" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1276" name="Constant_296279" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1277" name="Constant_296282" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1278" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1083,k.11"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1279" name="__module.model.gpt_neox.layers.5.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1121"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1280" name="Constant_296286" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1281" name="Constant_296285" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1282" name="__module.model.gpt_neox.layers.5.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1283" name="__module.model.gpt_neox.layers.5.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1284" name="__module.model.gpt_neox.layers.5.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1122,1127" /> + </output> + </layer> + <layer id="1285" name="__module.model.gpt_neox.layers.5.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1286" name="__module.model.gpt_neox.layers.5.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1124,1125,1129,1130" /> + </output> + </layer> + <layer id="1287" name="Constant_337638" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1288" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1289" name="Constant_296284" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1290" name="ScatterUpdate_296287" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1291" name="Constant_296290" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1292" name="Constant_296293" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1293" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1131,x2.23"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1294" name="Constant_325245" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1295" name="__module.model.gpt_neox.layers.5.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1132"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1296" name="Constant_296338" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1297" name="Constant_296343" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1298" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1126"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1299" name="__module.model.gpt_neox.layers.5.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1134"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1300" name="__module.model.gpt_neox.layers.5.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1135"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1301" name="__module.model.gpt_neox.layers.5.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1136,1140"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1302" name="__module.model.gpt_neox.layers.5.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.5.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1303" name="Constant_432781" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1304" name="Constant_432774" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1305" name="Constant_432776" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1306" name="Constant_432778" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1307" name="Concat_432779" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1308" name="Broadcast_432782" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1309" name="ReadValue_417392" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.5.valuepresent.5.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.5.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1310" name="Constant_401923" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1311" name="Gather_401924" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1312" name="Constant_296388" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1313" name="Constant_296391" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1314" name="Constant_296394" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1315" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1078"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1316" name="Constant_3155" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1079"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1317" name="__module.model.gpt_neox.layers.5.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1080"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1318" name="__module.model.gpt_neox.layers.5.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.5.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1319" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="1157"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1320" name="Constant_296398" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1321" name="Constant_296397" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1322" name="ShapeOf_338374" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1323" name="Constant_338375" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1324" name="Constant_338376" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1325" name="Gather_338377" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="1326" name="Add_338378" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1152" /> + </output> + </layer> + <layer id="1327" name="ShapeOf_338445" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1328" name="Constant_338446" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1329" name="Constant_338447" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1330" name="Gather_338448" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1150" /> + </output> + </layer> + <layer id="1331" name="__module.model.gpt_neox.layers.5.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1154,1155" /> + </output> + </layer> + <layer id="1332" name="Constant_337640" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1333" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1334" name="Constant_296396" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1335" name="ScatterUpdate_296399" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1336" name="Constant_296400" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1337" name="Constant_337642" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1338" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1339" name="ScatterUpdate_296401" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1340" name="Constant_296404" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1341" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1158"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1342" name="Constant_296477" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1343" name="Constant_296478" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1344" name="Constant_296474" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1345" name="Constant_296473" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1346" name="ScatterUpdate_296479" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1347" name="Constant_296482" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1348" name="__module.model.gpt_neox.layers.5.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1159,1160"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1349" name="__module.model.gpt_neox.layers.5.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1350" name="__module.model.gpt_neox.layers.5.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="1147" /> + </output> + </layer> + <layer id="1351" name="__module.model.gpt_neox.layers.5.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="1161,causal_mask.21"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1352" name="Add_315348" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1353" name="ShapeOf_315349" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1354" name="Constant_338451" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1355" name="Constant_338452" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1356" name="Gather_338453" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1145"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1357" name="Constant_268011" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1358" name="Constant_268013" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1359" name="Constant_268015" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1360" name="__module.model.gpt_neox.layers.5.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1162"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1361" name="Maximum_315350" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1362" name="__module.model.gpt_neox.layers.5.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1164"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1363" name="__module.model.gpt_neox.layers.5.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1165,1166,sdpa_result.11,tensor.21"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1364" name="Constant_3596" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1167"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1365" name="__module.model.gpt_neox.layers.5.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1168"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1366" name="__module.model.gpt_neox.layers.5.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1367" name="__module.model.gpt_neox.layers.5.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1173"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1368" name="self.model.gpt_neox.layers.5.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="1271713924" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1369" name="Convert_449086" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1370" name="self.model.gpt_neox.layers.5.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1288491140" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1371" name="Convert_449089" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1372" name="self.model.gpt_neox.layers.5.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1373" name="self.model.gpt_neox.layers.5.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1288495236" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1374" name="self.model.gpt_neox.layers.5.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1375" name="self.model.gpt_neox.layers.5.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1376" name="__module.model.gpt_neox.layers.5.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1377" name="Constant_325246" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1288503428" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1378" name="__module.model.gpt_neox.layers.5.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1176,1178,input.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1379" name="__module.model.gpt_neox.layers.5/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1182,attn_output.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1380" name="__module.model.gpt_neox.layers.5.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1381" name="__module.model.gpt_neox.layers.5.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1382" name="Constant_325247" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1288519812" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1383" name="__module.model.gpt_neox.layers.5.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1384" name="Constant_325248" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1288536196" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1385" name="__module.model.gpt_neox.layers.5.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1186"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1386" name="self.model.gpt_neox.layers.5.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="1288552580" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1387" name="Convert_449097" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1388" name="self.model.gpt_neox.layers.5.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="1355661444" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1389" name="Convert_449100" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1390" name="self.model.gpt_neox.layers.5.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1391" name="self.model.gpt_neox.layers.5.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="1355677828" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1392" name="self.model.gpt_neox.layers.5.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1393" name="self.model.gpt_neox.layers.5.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1394" name="__module.model.gpt_neox.layers.5.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1395" name="Constant_325249" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="1355710596" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1396" name="__module.model.gpt_neox.layers.5.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1191"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1397" name="__module.model.gpt_neox.layers.5.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1192"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1398" name="self.model.gpt_neox.layers.5.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="1355776132" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1399" name="Convert_449108" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1400" name="self.model.gpt_neox.layers.5.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1422884996" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1401" name="Convert_449111" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1402" name="self.model.gpt_neox.layers.5.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1403" name="self.model.gpt_neox.layers.5.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1422889092" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1404" name="self.model.gpt_neox.layers.5.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1405" name="self.model.gpt_neox.layers.5.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1406" name="__module.model.gpt_neox.layers.5.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1407" name="Constant_325250" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1422897284" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1408" name="__module.model.gpt_neox.layers.5.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1195,input.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1409" name="__module.model.gpt_neox.layers.5/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1197,1199,hidden_states.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1410" name="__module.model.gpt_neox.layers.6.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1411" name="__module.model.gpt_neox.layers.6.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1412" name="Constant_325251" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1422913668" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1413" name="__module.model.gpt_neox.layers.6.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1414" name="Constant_325252" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1422930052" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1415" name="__module.model.gpt_neox.layers.6.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1209"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1416" name="self.model.gpt_neox.layers.6.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="1422946436" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1417" name="Convert_449119" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1418" name="self.model.gpt_neox.layers.6.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="1473278084" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1419" name="Convert_449122" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1420" name="self.model.gpt_neox.layers.6.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1421" name="self.model.gpt_neox.layers.6.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="1473290372" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1422" name="self.model.gpt_neox.layers.6.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1423" name="self.model.gpt_neox.layers.6.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1424" name="__module.model.gpt_neox.layers.6.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1425" name="Constant_325253" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="1473314948" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1426" name="__module.model.gpt_neox.layers.6.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1216,qkv.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1427" name="__module.model.gpt_neox.layers.6.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1428" name="__module.model.gpt_neox.layers.6.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1220,qkv.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="1429" name="Constant_296489" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1430" name="Constant_296492" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1431" name="Constant_296495" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1432" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1221"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1433" name="Constant_3708" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1222"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1434" name="__module.model.gpt_neox.layers.6.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1223,query.37"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1435" name="Constant_296501" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1436" name="Constant_296504" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1437" name="Constant_296507" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1438" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1230,q.13"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1439" name="self.model.gpt_neox.layers.6.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.6.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1440" name="__module.model.gpt_neox.layers.6.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1441" name="Constant_296513" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1442" name="Constant_296516" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1443" name="Constant_296519" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1444" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1224"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1445" name="ShapeOf_338455" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1446" name="Constant_340988" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1447" name="Constant_338457" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1448" name="Gather_338458" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1234"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1449" name="Constant_432794" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1450" name="Constant_432787" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1451" name="Constant_432789" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1452" name="Constant_432791" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1453" name="Concat_432792" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1454" name="Broadcast_432795" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1455" name="ReadValue_417394" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.6.keypresent.6.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.6.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1456" name="Constant_401926" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1457" name="Gather_401927" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1458" name="ShapeOf_338460" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1459" name="Constant_338461" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1460" name="Constant_338462" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1461" name="Gather_338463" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1236" /> + </output> + </layer> + <layer id="1462" name="Constant_337644" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1463" name="Reshape_340917" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1464" name="__module.model.gpt_neox.layers.6.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1235,1239,1240,seq_len.25"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1465" name="__module.model.gpt_neox.layers.6.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1466" name="__module.model.gpt_neox.layers.6.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1243,1246,cos.25"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1467" name="Constant_38263" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1468" name="__module.model.gpt_neox.layers.6.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1249"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1469" name="__module.model.gpt_neox.layers.6.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1250,cos.27"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1470" name="__module.model.gpt_neox.layers.6.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1254"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1471" name="Constant_296524" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1472" name="Constant_296523" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1473" name="__module.model.gpt_neox.layers.6.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1474" name="__module.model.gpt_neox.layers.6.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1475" name="__module.model.gpt_neox.layers.6.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1255,1260" /> + </output> + </layer> + <layer id="1476" name="__module.model.gpt_neox.layers.6.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1477" name="__module.model.gpt_neox.layers.6.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1257,1258,1262,1263" /> + </output> + </layer> + <layer id="1478" name="Constant_337646" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1479" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1480" name="Constant_296522" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1481" name="ScatterUpdate_296525" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1482" name="Constant_296528" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1483" name="Constant_296531" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1484" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1264,x2.25"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1485" name="Constant_325254" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1486" name="__module.model.gpt_neox.layers.6.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1265"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1487" name="Constant_296576" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1488" name="Constant_296581" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1489" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1259"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1490" name="__module.model.gpt_neox.layers.6.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1267"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1491" name="self.model.gpt_neox.layers.6.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.6.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1492" name="__module.model.gpt_neox.layers.6.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1493" name="__module.model.gpt_neox.layers.6.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1494" name="__module.model.gpt_neox.layers.6.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1244,1247,sin.25"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1495" name="Constant_38266" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1496" name="__module.model.gpt_neox.layers.6.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1252"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1497" name="__module.model.gpt_neox.layers.6.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1253,sin.27"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1498" name="__module.model.gpt_neox.layers.6.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1268"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1499" name="__module.model.gpt_neox.layers.6.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1269,1287,1297,query.39,query.41"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1500" name="Constant_3722" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1225"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1501" name="__module.model.gpt_neox.layers.6.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1226,key.37"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1502" name="Constant_296627" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1503" name="Constant_296630" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1504" name="Constant_296633" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1505" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1232,k.13"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1506" name="__module.model.gpt_neox.layers.6.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1270"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1507" name="Constant_296637" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1508" name="Constant_296636" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1509" name="__module.model.gpt_neox.layers.6.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1510" name="__module.model.gpt_neox.layers.6.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1511" name="__module.model.gpt_neox.layers.6.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1271,1276" /> + </output> + </layer> + <layer id="1512" name="__module.model.gpt_neox.layers.6.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1513" name="__module.model.gpt_neox.layers.6.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1273,1274,1278,1279" /> + </output> + </layer> + <layer id="1514" name="Constant_337648" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1515" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1516" name="Constant_296635" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1517" name="ScatterUpdate_296638" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1518" name="Constant_296641" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1519" name="Constant_296644" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1520" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1280,x2.27"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1521" name="Constant_325255" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1522" name="__module.model.gpt_neox.layers.6.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1281"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1523" name="Constant_296689" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1524" name="Constant_296694" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1525" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1275"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1526" name="__module.model.gpt_neox.layers.6.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1283"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1527" name="__module.model.gpt_neox.layers.6.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1284"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1528" name="__module.model.gpt_neox.layers.6.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1285,1289"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1529" name="__module.model.gpt_neox.layers.6.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.6.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1530" name="Constant_432807" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1531" name="Constant_432800" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1532" name="Constant_432802" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1533" name="Constant_432804" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1534" name="Concat_432805" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1535" name="Broadcast_432808" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1536" name="ReadValue_417396" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.6.valuepresent.6.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.6.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1537" name="Constant_401929" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1538" name="Gather_401930" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1539" name="Constant_296739" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1540" name="Constant_296742" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1541" name="Constant_296745" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1542" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1227"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1543" name="Constant_3736" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1228"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1544" name="__module.model.gpt_neox.layers.6.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1229"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1545" name="__module.model.gpt_neox.layers.6.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.6.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1546" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="1306"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1547" name="Constant_296749" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1548" name="Constant_296748" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1549" name="ShapeOf_338465" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1550" name="Constant_338466" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1551" name="Constant_338467" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1552" name="Gather_338468" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="1553" name="Add_338469" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1301" /> + </output> + </layer> + <layer id="1554" name="ShapeOf_338536" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1555" name="Constant_338537" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1556" name="Constant_338538" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1557" name="Gather_338539" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1299" /> + </output> + </layer> + <layer id="1558" name="__module.model.gpt_neox.layers.6.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1303,1304" /> + </output> + </layer> + <layer id="1559" name="Constant_337650" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1560" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1561" name="Constant_296747" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1562" name="ScatterUpdate_296750" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1563" name="Constant_296751" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1564" name="Constant_337652" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1565" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1566" name="ScatterUpdate_296752" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1567" name="Constant_296755" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1568" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1307"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1569" name="Constant_296828" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1570" name="Constant_296829" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1571" name="Constant_296825" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1572" name="Constant_296824" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1573" name="ScatterUpdate_296830" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1574" name="Constant_296833" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1575" name="__module.model.gpt_neox.layers.6.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1308,1309"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1576" name="__module.model.gpt_neox.layers.6.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1577" name="__module.model.gpt_neox.layers.6.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="1296" /> + </output> + </layer> + <layer id="1578" name="__module.model.gpt_neox.layers.6.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="1310,causal_mask.25"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1579" name="Add_315420" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1580" name="ShapeOf_315421" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1581" name="Constant_338542" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1582" name="Constant_338543" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1583" name="Gather_338544" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1294"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1584" name="Constant_268021" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1585" name="Constant_268023" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1586" name="Constant_268025" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1587" name="__module.model.gpt_neox.layers.6.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1311"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1588" name="Maximum_315422" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1589" name="__module.model.gpt_neox.layers.6.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1313"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1590" name="__module.model.gpt_neox.layers.6.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1314,1315,sdpa_result.13,tensor.25"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1591" name="Constant_4177" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1316"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1592" name="__module.model.gpt_neox.layers.6.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1317"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1593" name="__module.model.gpt_neox.layers.6.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1594" name="__module.model.gpt_neox.layers.6.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1322"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1595" name="self.model.gpt_neox.layers.6.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="1473364100" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1596" name="Convert_449130" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1597" name="self.model.gpt_neox.layers.6.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1490141316" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1598" name="Convert_449133" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1599" name="self.model.gpt_neox.layers.6.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1600" name="self.model.gpt_neox.layers.6.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1490145412" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1601" name="self.model.gpt_neox.layers.6.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1602" name="self.model.gpt_neox.layers.6.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1603" name="__module.model.gpt_neox.layers.6.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1604" name="Constant_325256" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1490153604" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1605" name="__module.model.gpt_neox.layers.6.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1325,1327,input.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1606" name="__module.model.gpt_neox.layers.6/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1331,attn_output.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1607" name="__module.model.gpt_neox.layers.6.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1608" name="__module.model.gpt_neox.layers.6.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1609" name="Constant_325257" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1490169988" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1610" name="__module.model.gpt_neox.layers.6.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1611" name="Constant_325258" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1490186372" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1612" name="__module.model.gpt_neox.layers.6.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1335"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1613" name="self.model.gpt_neox.layers.6.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="1490202756" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1614" name="Convert_449141" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1615" name="self.model.gpt_neox.layers.6.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="1557311620" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1616" name="Convert_449144" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1617" name="self.model.gpt_neox.layers.6.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1618" name="self.model.gpt_neox.layers.6.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="1557328004" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1619" name="self.model.gpt_neox.layers.6.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1620" name="self.model.gpt_neox.layers.6.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1621" name="__module.model.gpt_neox.layers.6.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1622" name="Constant_325259" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="1557360772" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1623" name="__module.model.gpt_neox.layers.6.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1340"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1624" name="__module.model.gpt_neox.layers.6.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1341"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1625" name="self.model.gpt_neox.layers.6.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="1557426308" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1626" name="Convert_449152" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1627" name="self.model.gpt_neox.layers.6.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1624535172" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1628" name="Convert_449155" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1629" name="self.model.gpt_neox.layers.6.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1630" name="self.model.gpt_neox.layers.6.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1624539268" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1631" name="self.model.gpt_neox.layers.6.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1632" name="self.model.gpt_neox.layers.6.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1633" name="__module.model.gpt_neox.layers.6.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1634" name="Constant_325260" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1624547460" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1635" name="__module.model.gpt_neox.layers.6.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1344,input.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1636" name="__module.model.gpt_neox.layers.6/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1346,1348,hidden_states.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1637" name="__module.model.gpt_neox.layers.7.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1638" name="__module.model.gpt_neox.layers.7.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1639" name="Constant_325261" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1624563844" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1640" name="__module.model.gpt_neox.layers.7.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1641" name="Constant_325262" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1624580228" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1642" name="__module.model.gpt_neox.layers.7.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1358"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1643" name="self.model.gpt_neox.layers.7.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="1624596612" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1644" name="Convert_449163" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1645" name="self.model.gpt_neox.layers.7.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="1674928260" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1646" name="Convert_449166" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1647" name="self.model.gpt_neox.layers.7.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1648" name="self.model.gpt_neox.layers.7.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="1674940548" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1649" name="self.model.gpt_neox.layers.7.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1650" name="self.model.gpt_neox.layers.7.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1651" name="__module.model.gpt_neox.layers.7.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1652" name="Constant_325263" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="1674965124" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1653" name="__module.model.gpt_neox.layers.7.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1365,qkv.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1654" name="__module.model.gpt_neox.layers.7.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1655" name="__module.model.gpt_neox.layers.7.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1369,qkv.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="1656" name="Constant_296840" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1657" name="Constant_296843" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1658" name="Constant_296846" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1659" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1370"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1660" name="Constant_4289" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1371"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1661" name="__module.model.gpt_neox.layers.7.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1372,query.43"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1662" name="Constant_296852" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1663" name="Constant_296855" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1664" name="Constant_296858" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1665" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1379,q.15"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1666" name="self.model.gpt_neox.layers.7.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.7.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1667" name="__module.model.gpt_neox.layers.7.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1668" name="Constant_296864" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1669" name="Constant_296867" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1670" name="Constant_296870" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1671" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1373"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1672" name="ShapeOf_338546" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1673" name="Constant_340991" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1674" name="Constant_338548" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1675" name="Gather_338549" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1383"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1676" name="Constant_432820" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1677" name="Constant_432813" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1678" name="Constant_432815" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1679" name="Constant_432817" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1680" name="Concat_432818" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1681" name="Broadcast_432821" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1682" name="ReadValue_417398" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.7.keypresent.7.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.7.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1683" name="Constant_401932" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1684" name="Gather_401933" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1685" name="ShapeOf_338551" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1686" name="Constant_338552" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1687" name="Constant_338553" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1688" name="Gather_338554" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1385" /> + </output> + </layer> + <layer id="1689" name="Constant_337654" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1690" name="Reshape_340919" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1691" name="__module.model.gpt_neox.layers.7.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1384,1388,1389,seq_len.29"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1692" name="__module.model.gpt_neox.layers.7.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1693" name="__module.model.gpt_neox.layers.7.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1392,1395,cos.29"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1694" name="Constant_38269" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1695" name="__module.model.gpt_neox.layers.7.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1398"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1696" name="__module.model.gpt_neox.layers.7.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1399,cos.31"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1697" name="__module.model.gpt_neox.layers.7.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1403"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1698" name="Constant_296875" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1699" name="Constant_296874" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1700" name="__module.model.gpt_neox.layers.7.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1701" name="__module.model.gpt_neox.layers.7.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1702" name="__module.model.gpt_neox.layers.7.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1404,1409" /> + </output> + </layer> + <layer id="1703" name="__module.model.gpt_neox.layers.7.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1704" name="__module.model.gpt_neox.layers.7.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1406,1407,1411,1412" /> + </output> + </layer> + <layer id="1705" name="Constant_337656" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1706" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1707" name="Constant_296873" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1708" name="ScatterUpdate_296876" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1709" name="Constant_296879" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1710" name="Constant_296882" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1711" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1413,x2.29"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1712" name="Constant_325264" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1713" name="__module.model.gpt_neox.layers.7.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1414"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1714" name="Constant_296927" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1715" name="Constant_296932" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1716" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1408"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1717" name="__module.model.gpt_neox.layers.7.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1416"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1718" name="self.model.gpt_neox.layers.7.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.7.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1719" name="__module.model.gpt_neox.layers.7.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1720" name="__module.model.gpt_neox.layers.7.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1721" name="__module.model.gpt_neox.layers.7.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1393,1396,sin.29"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1722" name="Constant_38272" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1723" name="__module.model.gpt_neox.layers.7.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1401"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1724" name="__module.model.gpt_neox.layers.7.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1402,sin.31"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1725" name="__module.model.gpt_neox.layers.7.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1417"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1726" name="__module.model.gpt_neox.layers.7.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1418,1436,1446,query.45,query.47"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1727" name="Constant_4303" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1374"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1728" name="__module.model.gpt_neox.layers.7.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1375,key.43"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1729" name="Constant_296978" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1730" name="Constant_296981" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1731" name="Constant_296984" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1732" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1381,k.15"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1733" name="__module.model.gpt_neox.layers.7.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1419"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1734" name="Constant_296988" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1735" name="Constant_296987" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1736" name="__module.model.gpt_neox.layers.7.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1737" name="__module.model.gpt_neox.layers.7.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1738" name="__module.model.gpt_neox.layers.7.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1420,1425" /> + </output> + </layer> + <layer id="1739" name="__module.model.gpt_neox.layers.7.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1740" name="__module.model.gpt_neox.layers.7.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1422,1423,1427,1428" /> + </output> + </layer> + <layer id="1741" name="Constant_337658" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1742" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1743" name="Constant_296986" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1744" name="ScatterUpdate_296989" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1745" name="Constant_296992" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1746" name="Constant_296995" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1747" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1429,x2.31"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1748" name="Constant_325265" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1749" name="__module.model.gpt_neox.layers.7.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1430"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1750" name="Constant_297040" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1751" name="Constant_297045" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1752" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1424"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1753" name="__module.model.gpt_neox.layers.7.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1432"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1754" name="__module.model.gpt_neox.layers.7.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1433"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1755" name="__module.model.gpt_neox.layers.7.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1434,1438"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1756" name="__module.model.gpt_neox.layers.7.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.7.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1757" name="Constant_432833" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1758" name="Constant_432826" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1759" name="Constant_432828" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1760" name="Constant_432830" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1761" name="Concat_432831" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1762" name="Broadcast_432834" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1763" name="ReadValue_417400" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.7.valuepresent.7.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.7.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1764" name="Constant_401935" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1765" name="Gather_401936" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1766" name="Constant_297090" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1767" name="Constant_297093" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1768" name="Constant_297096" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1769" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1376"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1770" name="Constant_4317" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1377"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1771" name="__module.model.gpt_neox.layers.7.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1378"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1772" name="__module.model.gpt_neox.layers.7.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.7.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1773" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="1455"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1774" name="Constant_297100" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1775" name="Constant_297099" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1776" name="ShapeOf_338556" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1777" name="Constant_338557" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1778" name="Constant_338558" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1779" name="Gather_338559" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="1780" name="Add_338560" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1450" /> + </output> + </layer> + <layer id="1781" name="ShapeOf_338627" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1782" name="Constant_338628" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1783" name="Constant_338629" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1784" name="Gather_338630" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1448" /> + </output> + </layer> + <layer id="1785" name="__module.model.gpt_neox.layers.7.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1452,1453" /> + </output> + </layer> + <layer id="1786" name="Constant_337660" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1787" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1788" name="Constant_297098" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1789" name="ScatterUpdate_297101" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1790" name="Constant_297102" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1791" name="Constant_337662" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1792" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1793" name="ScatterUpdate_297103" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1794" name="Constant_297106" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1795" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1456"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="1796" name="Constant_297179" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1797" name="Constant_297180" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1798" name="Constant_297176" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1799" name="Constant_297175" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1800" name="ScatterUpdate_297181" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1801" name="Constant_297184" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1802" name="__module.model.gpt_neox.layers.7.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1457,1458"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1803" name="__module.model.gpt_neox.layers.7.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1804" name="__module.model.gpt_neox.layers.7.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="1445" /> + </output> + </layer> + <layer id="1805" name="__module.model.gpt_neox.layers.7.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="1459,causal_mask.29"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1806" name="Add_315492" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1807" name="ShapeOf_315493" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1808" name="Constant_338633" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1809" name="Constant_338634" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1810" name="Gather_338635" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1443"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1811" name="Constant_268031" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1812" name="Constant_268033" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1813" name="Constant_268035" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1814" name="__module.model.gpt_neox.layers.7.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1460"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1815" name="Maximum_315494" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1816" name="__module.model.gpt_neox.layers.7.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1462"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1817" name="__module.model.gpt_neox.layers.7.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1463,1464,sdpa_result.15,tensor.29"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1818" name="Constant_4758" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1465"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1819" name="__module.model.gpt_neox.layers.7.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1466"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1820" name="__module.model.gpt_neox.layers.7.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1821" name="__module.model.gpt_neox.layers.7.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1471"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1822" name="self.model.gpt_neox.layers.7.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="1675014276" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1823" name="Convert_449174" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1824" name="self.model.gpt_neox.layers.7.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1691791492" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1825" name="Convert_449177" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1826" name="self.model.gpt_neox.layers.7.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1827" name="self.model.gpt_neox.layers.7.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1691795588" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1828" name="self.model.gpt_neox.layers.7.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1829" name="self.model.gpt_neox.layers.7.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1830" name="__module.model.gpt_neox.layers.7.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1831" name="Constant_325266" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1691803780" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1832" name="__module.model.gpt_neox.layers.7.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1474,1476,input.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1833" name="__module.model.gpt_neox.layers.7/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1480,attn_output.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1834" name="__module.model.gpt_neox.layers.7.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1835" name="__module.model.gpt_neox.layers.7.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1836" name="Constant_325267" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1691820164" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1837" name="__module.model.gpt_neox.layers.7.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1838" name="Constant_325268" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1691836548" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1839" name="__module.model.gpt_neox.layers.7.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1484"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1840" name="self.model.gpt_neox.layers.7.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="1691852932" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1841" name="Convert_449185" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1842" name="self.model.gpt_neox.layers.7.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="1758961796" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1843" name="Convert_449188" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1844" name="self.model.gpt_neox.layers.7.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1845" name="self.model.gpt_neox.layers.7.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="1758978180" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1846" name="self.model.gpt_neox.layers.7.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1847" name="self.model.gpt_neox.layers.7.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1848" name="__module.model.gpt_neox.layers.7.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1849" name="Constant_325269" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="1759010948" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1850" name="__module.model.gpt_neox.layers.7.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1489"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1851" name="__module.model.gpt_neox.layers.7.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1490"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1852" name="self.model.gpt_neox.layers.7.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="1759076484" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1853" name="Convert_449196" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1854" name="self.model.gpt_neox.layers.7.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1826185348" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1855" name="Convert_449199" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1856" name="self.model.gpt_neox.layers.7.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1857" name="self.model.gpt_neox.layers.7.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1826189444" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1858" name="self.model.gpt_neox.layers.7.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1859" name="self.model.gpt_neox.layers.7.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="1860" name="__module.model.gpt_neox.layers.7.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1861" name="Constant_325270" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1826197636" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1862" name="__module.model.gpt_neox.layers.7.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1493,input.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1863" name="__module.model.gpt_neox.layers.7/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1495,1497,hidden_states.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1864" name="__module.model.gpt_neox.layers.8.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1865" name="__module.model.gpt_neox.layers.8.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1866" name="Constant_325271" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1826214020" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1867" name="__module.model.gpt_neox.layers.8.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1868" name="Constant_325272" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1826230404" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1869" name="__module.model.gpt_neox.layers.8.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1507"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1870" name="self.model.gpt_neox.layers.8.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="1826246788" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1871" name="Convert_449207" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1872" name="self.model.gpt_neox.layers.8.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="1876578436" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1873" name="Convert_449210" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1874" name="self.model.gpt_neox.layers.8.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1875" name="self.model.gpt_neox.layers.8.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="1876590724" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1876" name="self.model.gpt_neox.layers.8.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1877" name="self.model.gpt_neox.layers.8.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="1878" name="__module.model.gpt_neox.layers.8.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1879" name="Constant_325273" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="1876615300" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1880" name="__module.model.gpt_neox.layers.8.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1514,qkv.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="1881" name="__module.model.gpt_neox.layers.8.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1882" name="__module.model.gpt_neox.layers.8.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1518,qkv.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="1883" name="Constant_297191" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1884" name="Constant_297194" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1885" name="Constant_297197" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1886" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1519"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1887" name="Constant_4870" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1520"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1888" name="__module.model.gpt_neox.layers.8.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1521,query.49"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1889" name="Constant_297203" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1890" name="Constant_297206" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1891" name="Constant_297209" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1892" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1528,q.17"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1893" name="self.model.gpt_neox.layers.8.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.8.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1894" name="__module.model.gpt_neox.layers.8.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1895" name="Constant_297215" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1896" name="Constant_297218" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1897" name="Constant_297221" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1898" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1522"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1899" name="ShapeOf_338637" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1900" name="Constant_340994" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1901" name="Constant_338639" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1902" name="Gather_338640" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1532"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1903" name="Constant_432846" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1904" name="Constant_432839" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1905" name="Constant_432841" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1906" name="Constant_432843" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1907" name="Concat_432844" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1908" name="Broadcast_432847" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1909" name="ReadValue_417402" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.8.keypresent.8.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.8.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1910" name="Constant_401938" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1911" name="Gather_401939" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1912" name="ShapeOf_338642" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1913" name="Constant_338643" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1914" name="Constant_338644" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1915" name="Gather_338645" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1534" /> + </output> + </layer> + <layer id="1916" name="Constant_337664" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1917" name="Reshape_340921" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1918" name="__module.model.gpt_neox.layers.8.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1533,1537,1538,seq_len.33"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1919" name="__module.model.gpt_neox.layers.8.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1920" name="__module.model.gpt_neox.layers.8.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1541,1544,cos.33"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1921" name="Constant_38275" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1922" name="__module.model.gpt_neox.layers.8.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1547"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1923" name="__module.model.gpt_neox.layers.8.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1548,cos.35"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1924" name="__module.model.gpt_neox.layers.8.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1552"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1925" name="Constant_297226" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1926" name="Constant_297225" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1927" name="__module.model.gpt_neox.layers.8.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1928" name="__module.model.gpt_neox.layers.8.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1929" name="__module.model.gpt_neox.layers.8.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1553,1558" /> + </output> + </layer> + <layer id="1930" name="__module.model.gpt_neox.layers.8.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1931" name="__module.model.gpt_neox.layers.8.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1555,1556,1560,1561" /> + </output> + </layer> + <layer id="1932" name="Constant_337666" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1933" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1934" name="Constant_297224" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1935" name="ScatterUpdate_297227" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1936" name="Constant_297230" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1937" name="Constant_297233" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1938" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1562,x2.33"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1939" name="Constant_325274" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1940" name="__module.model.gpt_neox.layers.8.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1563"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1941" name="Constant_297278" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1942" name="Constant_297283" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1943" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1557"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1944" name="__module.model.gpt_neox.layers.8.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1565"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1945" name="self.model.gpt_neox.layers.8.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.8.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1946" name="__module.model.gpt_neox.layers.8.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1947" name="__module.model.gpt_neox.layers.8.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1948" name="__module.model.gpt_neox.layers.8.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1542,1545,sin.33"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1949" name="Constant_38278" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1950" name="__module.model.gpt_neox.layers.8.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1550"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1951" name="__module.model.gpt_neox.layers.8.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1551,sin.35"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1952" name="__module.model.gpt_neox.layers.8.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1566"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1953" name="__module.model.gpt_neox.layers.8.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1567,1585,1595,query.51,query.53"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1954" name="Constant_4884" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1523"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1955" name="__module.model.gpt_neox.layers.8.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1524,key.49"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1956" name="Constant_297329" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1957" name="Constant_297332" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1958" name="Constant_297335" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1959" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1530,k.17"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1960" name="__module.model.gpt_neox.layers.8.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1568"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1961" name="Constant_297339" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1962" name="Constant_297338" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1963" name="__module.model.gpt_neox.layers.8.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1964" name="__module.model.gpt_neox.layers.8.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1965" name="__module.model.gpt_neox.layers.8.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1569,1574" /> + </output> + </layer> + <layer id="1966" name="__module.model.gpt_neox.layers.8.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1967" name="__module.model.gpt_neox.layers.8.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1571,1572,1576,1577" /> + </output> + </layer> + <layer id="1968" name="Constant_337668" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1969" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1970" name="Constant_297337" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1971" name="ScatterUpdate_297340" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1972" name="Constant_297343" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1973" name="Constant_297346" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1974" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1578,x2.35"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1975" name="Constant_325275" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1976" name="__module.model.gpt_neox.layers.8.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1579"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1977" name="Constant_297391" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1978" name="Constant_297396" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1979" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1573"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1980" name="__module.model.gpt_neox.layers.8.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1581"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1981" name="__module.model.gpt_neox.layers.8.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1582"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1982" name="__module.model.gpt_neox.layers.8.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1583,1587"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1983" name="__module.model.gpt_neox.layers.8.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.8.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1984" name="Constant_432859" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1985" name="Constant_432852" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1986" name="Constant_432854" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1987" name="Constant_432856" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1988" name="Concat_432857" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1989" name="Broadcast_432860" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1990" name="ReadValue_417404" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.8.valuepresent.8.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.8.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1991" name="Constant_401941" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1992" name="Gather_401942" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1993" name="Constant_297441" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1994" name="Constant_297444" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1995" name="Constant_297447" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1996" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1525"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1997" name="Constant_4898" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1526"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1998" name="__module.model.gpt_neox.layers.8.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1527"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1999" name="__module.model.gpt_neox.layers.8.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.8.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2000" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="1604"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2001" name="Constant_297451" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2002" name="Constant_297450" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2003" name="ShapeOf_338647" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2004" name="Constant_338648" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2005" name="Constant_338649" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2006" name="Gather_338650" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="2007" name="Add_338651" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1599" /> + </output> + </layer> + <layer id="2008" name="ShapeOf_338718" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2009" name="Constant_338719" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2010" name="Constant_338720" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2011" name="Gather_338721" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1597" /> + </output> + </layer> + <layer id="2012" name="__module.model.gpt_neox.layers.8.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1601,1602" /> + </output> + </layer> + <layer id="2013" name="Constant_337670" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2014" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2015" name="Constant_297449" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2016" name="ScatterUpdate_297452" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2017" name="Constant_297453" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2018" name="Constant_337672" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2019" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2020" name="ScatterUpdate_297454" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2021" name="Constant_297457" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2022" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1605"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2023" name="Constant_297530" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2024" name="Constant_297531" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2025" name="Constant_297527" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2026" name="Constant_297526" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2027" name="ScatterUpdate_297532" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2028" name="Constant_297535" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2029" name="__module.model.gpt_neox.layers.8.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1606,1607"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2030" name="__module.model.gpt_neox.layers.8.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2031" name="__module.model.gpt_neox.layers.8.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="1594" /> + </output> + </layer> + <layer id="2032" name="__module.model.gpt_neox.layers.8.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="1608,causal_mask.33"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2033" name="Add_315564" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2034" name="ShapeOf_315565" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2035" name="Constant_338724" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2036" name="Constant_338725" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2037" name="Gather_338726" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1592"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2038" name="Constant_268041" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2039" name="Constant_268043" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2040" name="Constant_268045" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2041" name="__module.model.gpt_neox.layers.8.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1609"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2042" name="Maximum_315566" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2043" name="__module.model.gpt_neox.layers.8.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1611"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2044" name="__module.model.gpt_neox.layers.8.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1612,1613,sdpa_result.17,tensor.33"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2045" name="Constant_5339" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1614"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2046" name="__module.model.gpt_neox.layers.8.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1615"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2047" name="__module.model.gpt_neox.layers.8.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2048" name="__module.model.gpt_neox.layers.8.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1620"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2049" name="self.model.gpt_neox.layers.8.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="1876664452" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2050" name="Convert_449218" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2051" name="self.model.gpt_neox.layers.8.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="1893441668" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2052" name="Convert_449221" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2053" name="self.model.gpt_neox.layers.8.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2054" name="self.model.gpt_neox.layers.8.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="1893445764" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2055" name="self.model.gpt_neox.layers.8.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2056" name="self.model.gpt_neox.layers.8.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2057" name="__module.model.gpt_neox.layers.8.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2058" name="Constant_325276" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1893453956" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2059" name="__module.model.gpt_neox.layers.8.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1623,1625,input.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2060" name="__module.model.gpt_neox.layers.8/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1629,attn_output.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2061" name="__module.model.gpt_neox.layers.8.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2062" name="__module.model.gpt_neox.layers.8.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2063" name="Constant_325277" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1893470340" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2064" name="__module.model.gpt_neox.layers.8.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2065" name="Constant_325278" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="1893486724" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2066" name="__module.model.gpt_neox.layers.8.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1633"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2067" name="self.model.gpt_neox.layers.8.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="1893503108" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2068" name="Convert_449229" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2069" name="self.model.gpt_neox.layers.8.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="1960611972" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2070" name="Convert_449232" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2071" name="self.model.gpt_neox.layers.8.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2072" name="self.model.gpt_neox.layers.8.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="1960628356" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2073" name="self.model.gpt_neox.layers.8.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2074" name="self.model.gpt_neox.layers.8.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2075" name="__module.model.gpt_neox.layers.8.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2076" name="Constant_325279" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="1960661124" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2077" name="__module.model.gpt_neox.layers.8.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1638"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2078" name="__module.model.gpt_neox.layers.8.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1639"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2079" name="self.model.gpt_neox.layers.8.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="1960726660" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2080" name="Convert_449240" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2081" name="self.model.gpt_neox.layers.8.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2027835524" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2082" name="Convert_449243" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2083" name="self.model.gpt_neox.layers.8.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2084" name="self.model.gpt_neox.layers.8.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2027839620" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2085" name="self.model.gpt_neox.layers.8.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2086" name="self.model.gpt_neox.layers.8.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2087" name="__module.model.gpt_neox.layers.8.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2088" name="Constant_325280" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2027847812" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2089" name="__module.model.gpt_neox.layers.8.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1642,input.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2090" name="__module.model.gpt_neox.layers.8/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1644,1646,hidden_states.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2091" name="__module.model.gpt_neox.layers.9.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2092" name="__module.model.gpt_neox.layers.9.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2093" name="Constant_325281" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2027864196" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2094" name="__module.model.gpt_neox.layers.9.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2095" name="Constant_325282" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2027880580" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2096" name="__module.model.gpt_neox.layers.9.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1656"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2097" name="self.model.gpt_neox.layers.9.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="2027896964" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2098" name="Convert_449251" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2099" name="self.model.gpt_neox.layers.9.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="2078228612" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2100" name="Convert_449254" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2101" name="self.model.gpt_neox.layers.9.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2102" name="self.model.gpt_neox.layers.9.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="2078240900" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2103" name="self.model.gpt_neox.layers.9.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2104" name="self.model.gpt_neox.layers.9.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2105" name="__module.model.gpt_neox.layers.9.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2106" name="Constant_325283" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="2078265476" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2107" name="__module.model.gpt_neox.layers.9.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1663,qkv.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2108" name="__module.model.gpt_neox.layers.9.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2109" name="__module.model.gpt_neox.layers.9.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1667,qkv.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="2110" name="Constant_297792" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2111" name="Constant_297795" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2112" name="Constant_297798" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2113" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1674"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2114" name="Constant_5479" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1675"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2115" name="__module.model.gpt_neox.layers.9.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1676"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2116" name="__module.model.gpt_neox.layers.9.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.9.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2118" name="Constant_432872" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2119" name="Constant_432865" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2120" name="Constant_432867" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2121" name="Constant_432869" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2122" name="Concat_432870" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2123" name="Broadcast_432873" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2124" name="ReadValue_417406" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.9.keypresent.9.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.9.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2125" name="Constant_401944" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2126" name="Gather_401945" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2127" name="Constant_297566" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2128" name="Constant_297569" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2129" name="Constant_297572" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2130" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1671"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2131" name="Constant_5465" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1672"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2132" name="__module.model.gpt_neox.layers.9.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1673,key.55"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2133" name="Constant_297680" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2134" name="Constant_297683" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2135" name="Constant_297686" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2136" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1679,k.19"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2137" name="self.model.gpt_neox.layers.9.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.9.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2138" name="__module.model.gpt_neox.layers.9.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2139" name="ShapeOf_338728" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2140" name="Constant_340997" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2141" name="Constant_338730" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2142" name="Gather_338731" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1681"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2143" name="ShapeOf_338733" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2144" name="Constant_338734" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2145" name="Constant_338735" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2146" name="Gather_338736" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1683" /> + </output> + </layer> + <layer id="2147" name="Constant_337674" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2148" name="Reshape_340923" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2149" name="__module.model.gpt_neox.layers.9.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1682,1686,1687,seq_len.37"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2150" name="__module.model.gpt_neox.layers.9.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2151" name="__module.model.gpt_neox.layers.9.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1690,1693,cos.37"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2152" name="Constant_38281" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2153" name="__module.model.gpt_neox.layers.9.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1696"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2154" name="__module.model.gpt_neox.layers.9.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1697,cos.39"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2155" name="__module.model.gpt_neox.layers.9.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1717"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2156" name="Constant_297690" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2157" name="Constant_297689" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2158" name="__module.model.gpt_neox.layers.9.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2159" name="__module.model.gpt_neox.layers.9.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2160" name="__module.model.gpt_neox.layers.9.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1718,1723" /> + </output> + </layer> + <layer id="2161" name="__module.model.gpt_neox.layers.9.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2162" name="__module.model.gpt_neox.layers.9.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1720,1721,1725,1726" /> + </output> + </layer> + <layer id="2163" name="Constant_337678" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2164" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2165" name="Constant_297688" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2166" name="ScatterUpdate_297691" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2167" name="Constant_297694" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2168" name="Constant_297697" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2169" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1727,x2.39"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2170" name="Constant_325285" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2171" name="__module.model.gpt_neox.layers.9.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1728"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2172" name="Constant_297742" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2173" name="Constant_297747" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2174" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1722"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2175" name="__module.model.gpt_neox.layers.9.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1730"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2176" name="self.model.gpt_neox.layers.9.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.9.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2177" name="__module.model.gpt_neox.layers.9.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2178" name="__module.model.gpt_neox.layers.9.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2179" name="__module.model.gpt_neox.layers.9.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1691,1694,sin.37"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2180" name="Constant_38284" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2181" name="__module.model.gpt_neox.layers.9.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1699"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2182" name="__module.model.gpt_neox.layers.9.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1700,sin.39"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2183" name="__module.model.gpt_neox.layers.9.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1731"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2184" name="__module.model.gpt_neox.layers.9.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1732,1736"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2185" name="__module.model.gpt_neox.layers.9.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.9.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2197" name="Constant_432885" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2198" name="Constant_432878" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2199" name="Constant_432880" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2200" name="Constant_432882" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2201" name="Concat_432883" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2202" name="Broadcast_432886" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2203" name="ReadValue_417384" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.31.valuepresent.31.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.31.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2204" name="Constant_402079" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2205" name="Gather_402080" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2206" name="Constant_297542" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2207" name="Constant_297545" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2208" name="Constant_297548" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2209" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1668"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2210" name="Constant_5451" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1669"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2211" name="__module.model.gpt_neox.layers.9.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1670,query.55"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2212" name="Constant_297554" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2213" name="Constant_297557" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2214" name="Constant_297560" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2215" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1677,q.19"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2216" name="__module.model.gpt_neox.layers.9.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1701"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2217" name="Constant_297577" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2218" name="Constant_297576" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2219" name="__module.model.gpt_neox.layers.9.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2220" name="__module.model.gpt_neox.layers.9.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2221" name="__module.model.gpt_neox.layers.9.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1702,1707" /> + </output> + </layer> + <layer id="2222" name="__module.model.gpt_neox.layers.9.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2223" name="__module.model.gpt_neox.layers.9.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1704,1705,1709,1710" /> + </output> + </layer> + <layer id="2224" name="Constant_337676" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2225" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2226" name="Constant_297575" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2227" name="ScatterUpdate_297578" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2228" name="Constant_297581" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2229" name="Constant_297584" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2230" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1711,x2.37"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2231" name="Constant_325284" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2232" name="__module.model.gpt_neox.layers.9.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1712"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2233" name="Constant_297629" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2234" name="Constant_297634" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2235" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1706"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2236" name="__module.model.gpt_neox.layers.9.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1714"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2237" name="__module.model.gpt_neox.layers.9.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1715"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2238" name="__module.model.gpt_neox.layers.9.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1716,1734,1744,query.57,query.59"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2239" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="1753"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2240" name="Constant_297802" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2241" name="Constant_297801" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2242" name="ShapeOf_338738" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2243" name="Constant_338739" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2244" name="Constant_338740" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2245" name="Gather_338741" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="2246" name="Add_338742" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1748" /> + </output> + </layer> + <layer id="2247" name="ShapeOf_338809" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2248" name="Constant_338810" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2249" name="Constant_338811" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2250" name="Gather_338812" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1746" /> + </output> + </layer> + <layer id="2251" name="__module.model.gpt_neox.layers.9.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1750,1751" /> + </output> + </layer> + <layer id="2252" name="Constant_337680" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2253" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2254" name="Constant_297800" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2255" name="ScatterUpdate_297803" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2256" name="Constant_297804" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2257" name="Constant_337682" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2258" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2259" name="ScatterUpdate_297805" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2260" name="Constant_297808" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2261" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1754"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2262" name="Constant_297881" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2263" name="Constant_297882" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2264" name="Constant_297878" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2265" name="Constant_297877" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2266" name="ScatterUpdate_297883" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2267" name="Constant_297886" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2268" name="__module.model.gpt_neox.layers.9.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1755,1756"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2269" name="__module.model.gpt_neox.layers.9.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2270" name="__module.model.gpt_neox.layers.9.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="1743" /> + </output> + </layer> + <layer id="2271" name="__module.model.gpt_neox.layers.9.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="1757,causal_mask.37"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2272" name="Add_315636" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2273" name="ShapeOf_315637" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2274" name="Constant_338815" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2275" name="Constant_338816" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2276" name="Gather_338817" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1741"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2277" name="Constant_268051" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2278" name="Constant_268053" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2279" name="Constant_268055" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2280" name="__module.model.gpt_neox.layers.9.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1758"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2281" name="Maximum_315638" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2282" name="__module.model.gpt_neox.layers.9.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1760"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2283" name="__module.model.gpt_neox.layers.9.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1761,1762,sdpa_result.19,tensor.37"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2284" name="Constant_5920" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1763"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2285" name="__module.model.gpt_neox.layers.9.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1764"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2286" name="__module.model.gpt_neox.layers.9.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2287" name="__module.model.gpt_neox.layers.9.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1769"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2288" name="self.model.gpt_neox.layers.9.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="2078314628" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2289" name="Convert_449262" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2290" name="self.model.gpt_neox.layers.9.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2095091844" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2291" name="Convert_449265" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2292" name="self.model.gpt_neox.layers.9.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2293" name="self.model.gpt_neox.layers.9.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2095095940" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2294" name="self.model.gpt_neox.layers.9.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2295" name="self.model.gpt_neox.layers.9.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2296" name="__module.model.gpt_neox.layers.9.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2297" name="Constant_325286" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2095104132" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2298" name="__module.model.gpt_neox.layers.9.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1772,1774,input.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2299" name="__module.model.gpt_neox.layers.9/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1778,attn_output.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2300" name="__module.model.gpt_neox.layers.9.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2301" name="__module.model.gpt_neox.layers.9.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2302" name="Constant_325287" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2095120516" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2303" name="__module.model.gpt_neox.layers.9.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2304" name="Constant_325288" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2095136900" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2305" name="__module.model.gpt_neox.layers.9.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1782"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2306" name="self.model.gpt_neox.layers.9.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="2095153284" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2307" name="Convert_449273" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2308" name="self.model.gpt_neox.layers.9.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="2162262148" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2309" name="Convert_449276" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2310" name="self.model.gpt_neox.layers.9.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2311" name="self.model.gpt_neox.layers.9.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="2162278532" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2312" name="self.model.gpt_neox.layers.9.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2313" name="self.model.gpt_neox.layers.9.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2314" name="__module.model.gpt_neox.layers.9.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2315" name="Constant_325289" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="2162311300" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2316" name="__module.model.gpt_neox.layers.9.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1787"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2317" name="__module.model.gpt_neox.layers.9.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1788"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2318" name="self.model.gpt_neox.layers.9.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="2162376836" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2319" name="Convert_449284" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2320" name="self.model.gpt_neox.layers.9.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2229485700" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2321" name="Convert_449287" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2322" name="self.model.gpt_neox.layers.9.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2323" name="self.model.gpt_neox.layers.9.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2229489796" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2324" name="self.model.gpt_neox.layers.9.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2325" name="self.model.gpt_neox.layers.9.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2326" name="__module.model.gpt_neox.layers.9.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2327" name="Constant_325290" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2229497988" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2328" name="__module.model.gpt_neox.layers.9.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1791,input.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2329" name="__module.model.gpt_neox.layers.9/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1793,1795,hidden_states.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2330" name="__module.model.gpt_neox.layers.10.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2331" name="__module.model.gpt_neox.layers.10.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2332" name="Constant_325291" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2229514372" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2333" name="__module.model.gpt_neox.layers.10.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2334" name="Constant_325292" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2229530756" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2335" name="__module.model.gpt_neox.layers.10.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1805"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2336" name="self.model.gpt_neox.layers.10.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="2229547140" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2337" name="Convert_449295" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2338" name="self.model.gpt_neox.layers.10.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="2279878788" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2339" name="Convert_449298" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2340" name="self.model.gpt_neox.layers.10.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2341" name="self.model.gpt_neox.layers.10.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="2279891076" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2342" name="self.model.gpt_neox.layers.10.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2343" name="self.model.gpt_neox.layers.10.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2344" name="__module.model.gpt_neox.layers.10.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2345" name="Constant_325293" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="2279915652" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2346" name="__module.model.gpt_neox.layers.10.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1812,qkv.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2347" name="__module.model.gpt_neox.layers.10.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2348" name="__module.model.gpt_neox.layers.10.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1816,qkv.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="2349" name="Constant_297893" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2350" name="Constant_297896" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2351" name="Constant_297899" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2352" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1817"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2353" name="Constant_6032" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1818"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2354" name="__module.model.gpt_neox.layers.10.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1819,query.61"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2355" name="Constant_297905" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2356" name="Constant_297908" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2357" name="Constant_297911" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2358" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1826,q.21"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2359" name="self.model.gpt_neox.layers.10.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.10.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2360" name="__module.model.gpt_neox.layers.10.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2361" name="Constant_297917" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2362" name="Constant_297920" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2363" name="Constant_297923" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2364" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1820"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2365" name="ShapeOf_338819" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2366" name="Constant_341000" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2367" name="Constant_338821" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2368" name="Gather_338822" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1830"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2369" name="Constant_432898" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2370" name="Constant_432891" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2371" name="Constant_432893" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2372" name="Constant_432895" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2373" name="Concat_432896" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2374" name="Broadcast_432899" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2375" name="ReadValue_417290" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.10.keypresent.10.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.10.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2376" name="Constant_401950" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2377" name="Gather_401951" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2378" name="ShapeOf_338824" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2379" name="Constant_338825" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2380" name="Constant_338826" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2381" name="Gather_338827" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1832" /> + </output> + </layer> + <layer id="2382" name="Constant_337684" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2383" name="Reshape_340925" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2384" name="__module.model.gpt_neox.layers.10.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1831,1835,1836,seq_len.41"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2385" name="__module.model.gpt_neox.layers.10.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2386" name="__module.model.gpt_neox.layers.10.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1839,1842,cos.41"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2387" name="Constant_38287" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2388" name="__module.model.gpt_neox.layers.10.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1845"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2389" name="__module.model.gpt_neox.layers.10.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1846,cos.43"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2390" name="__module.model.gpt_neox.layers.10.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1850"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2391" name="Constant_297928" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2392" name="Constant_297927" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2393" name="__module.model.gpt_neox.layers.10.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2394" name="__module.model.gpt_neox.layers.10.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2395" name="__module.model.gpt_neox.layers.10.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1851,1856" /> + </output> + </layer> + <layer id="2396" name="__module.model.gpt_neox.layers.10.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2397" name="__module.model.gpt_neox.layers.10.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1853,1854,1858,1859" /> + </output> + </layer> + <layer id="2398" name="Constant_337686" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2399" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2400" name="Constant_297926" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2401" name="ScatterUpdate_297929" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2402" name="Constant_297932" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2403" name="Constant_297935" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2404" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1860,x2.41"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2405" name="Constant_325294" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2406" name="__module.model.gpt_neox.layers.10.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1861"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2407" name="Constant_297980" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2408" name="Constant_297985" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2409" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1855"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2410" name="__module.model.gpt_neox.layers.10.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1863"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2411" name="self.model.gpt_neox.layers.10.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.10.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2412" name="__module.model.gpt_neox.layers.10.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2413" name="__module.model.gpt_neox.layers.10.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2414" name="__module.model.gpt_neox.layers.10.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1840,1843,sin.41"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2415" name="Constant_38290" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2416" name="__module.model.gpt_neox.layers.10.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1848"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2417" name="__module.model.gpt_neox.layers.10.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1849,sin.43"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2418" name="__module.model.gpt_neox.layers.10.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1864"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2419" name="__module.model.gpt_neox.layers.10.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1865,1883,1893,query.63,query.65"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2420" name="Constant_6046" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1821"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2421" name="__module.model.gpt_neox.layers.10.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1822,key.61"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2422" name="Constant_298031" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2423" name="Constant_298034" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2424" name="Constant_298037" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2425" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1828,k.21"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2426" name="__module.model.gpt_neox.layers.10.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1866"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2427" name="Constant_298041" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2428" name="Constant_298040" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2429" name="__module.model.gpt_neox.layers.10.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2430" name="__module.model.gpt_neox.layers.10.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2431" name="__module.model.gpt_neox.layers.10.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1867,1872" /> + </output> + </layer> + <layer id="2432" name="__module.model.gpt_neox.layers.10.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2433" name="__module.model.gpt_neox.layers.10.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1869,1870,1874,1875" /> + </output> + </layer> + <layer id="2434" name="Constant_337688" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2435" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2436" name="Constant_298039" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2437" name="ScatterUpdate_298042" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2438" name="Constant_298045" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2439" name="Constant_298048" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2440" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1876,x2.43"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2441" name="Constant_325295" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2442" name="__module.model.gpt_neox.layers.10.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1877"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2443" name="Constant_298093" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2444" name="Constant_298098" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2445" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1871"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2446" name="__module.model.gpt_neox.layers.10.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1879"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2447" name="__module.model.gpt_neox.layers.10.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1880"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2448" name="__module.model.gpt_neox.layers.10.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1881,1885"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2449" name="__module.model.gpt_neox.layers.10.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.10.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2450" name="Constant_432911" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2451" name="Constant_432904" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2452" name="Constant_432906" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2453" name="Constant_432908" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2454" name="Concat_432909" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2455" name="Broadcast_432912" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2456" name="ReadValue_417292" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.10.valuepresent.10.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.10.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2457" name="Constant_401953" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2458" name="Gather_401954" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2459" name="Constant_298143" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2460" name="Constant_298146" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2461" name="Constant_298149" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2462" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1823"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2463" name="Constant_6060" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1824"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2464" name="__module.model.gpt_neox.layers.10.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1825"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2465" name="__module.model.gpt_neox.layers.10.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.10.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2466" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="1902"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2467" name="Constant_298153" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2468" name="Constant_298152" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2469" name="ShapeOf_338829" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2470" name="Constant_338830" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2471" name="Constant_338831" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2472" name="Gather_338832" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="2473" name="Add_338833" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1897" /> + </output> + </layer> + <layer id="2474" name="ShapeOf_338900" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2475" name="Constant_338901" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2476" name="Constant_338902" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2477" name="Gather_338903" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1895" /> + </output> + </layer> + <layer id="2478" name="__module.model.gpt_neox.layers.10.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="1899,1900" /> + </output> + </layer> + <layer id="2479" name="Constant_337690" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2480" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2481" name="Constant_298151" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2482" name="ScatterUpdate_298154" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2483" name="Constant_298155" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2484" name="Constant_337692" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2485" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2486" name="ScatterUpdate_298156" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2487" name="Constant_298159" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2488" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1903"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2489" name="Constant_298232" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2490" name="Constant_298233" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2491" name="Constant_298229" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2492" name="Constant_298228" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2493" name="ScatterUpdate_298234" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2494" name="Constant_298237" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2495" name="__module.model.gpt_neox.layers.10.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="1904,1905"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2496" name="__module.model.gpt_neox.layers.10.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2497" name="__module.model.gpt_neox.layers.10.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="1892" /> + </output> + </layer> + <layer id="2498" name="__module.model.gpt_neox.layers.10.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="1906,causal_mask.41"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2499" name="Add_315708" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2500" name="ShapeOf_315709" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2501" name="Constant_338906" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2502" name="Constant_338907" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2503" name="Gather_338908" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1890"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2504" name="Constant_268061" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2505" name="Constant_268063" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2506" name="Constant_268065" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2507" name="__module.model.gpt_neox.layers.10.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1907"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2508" name="Maximum_315710" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2509" name="__module.model.gpt_neox.layers.10.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1909"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2510" name="__module.model.gpt_neox.layers.10.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1910,1911,sdpa_result.21,tensor.41"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2511" name="Constant_6501" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1912"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2512" name="__module.model.gpt_neox.layers.10.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1913"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2513" name="__module.model.gpt_neox.layers.10.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2514" name="__module.model.gpt_neox.layers.10.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1918"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2515" name="self.model.gpt_neox.layers.10.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="2279964804" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2516" name="Convert_449306" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2517" name="self.model.gpt_neox.layers.10.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2296742020" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2518" name="Convert_449309" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2519" name="self.model.gpt_neox.layers.10.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2520" name="self.model.gpt_neox.layers.10.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2296746116" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2521" name="self.model.gpt_neox.layers.10.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2522" name="self.model.gpt_neox.layers.10.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2523" name="__module.model.gpt_neox.layers.10.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2524" name="Constant_325296" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2296754308" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2525" name="__module.model.gpt_neox.layers.10.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1921,1923,input.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2526" name="__module.model.gpt_neox.layers.10/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1927,attn_output.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2527" name="__module.model.gpt_neox.layers.10.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2528" name="__module.model.gpt_neox.layers.10.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2529" name="Constant_325297" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2296770692" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2530" name="__module.model.gpt_neox.layers.10.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2531" name="Constant_325298" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2296787076" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2532" name="__module.model.gpt_neox.layers.10.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1931"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2533" name="self.model.gpt_neox.layers.10.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="2296803460" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2534" name="Convert_449317" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2535" name="self.model.gpt_neox.layers.10.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="2363912324" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2536" name="Convert_449320" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2537" name="self.model.gpt_neox.layers.10.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2538" name="self.model.gpt_neox.layers.10.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="2363928708" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2539" name="self.model.gpt_neox.layers.10.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2540" name="self.model.gpt_neox.layers.10.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2541" name="__module.model.gpt_neox.layers.10.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2542" name="Constant_325299" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="2363961476" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2543" name="__module.model.gpt_neox.layers.10.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1936"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2544" name="__module.model.gpt_neox.layers.10.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1937"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2545" name="self.model.gpt_neox.layers.10.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="2364027012" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2546" name="Convert_449328" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2547" name="self.model.gpt_neox.layers.10.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2431135876" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2548" name="Convert_449331" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2549" name="self.model.gpt_neox.layers.10.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2550" name="self.model.gpt_neox.layers.10.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2431139972" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2551" name="self.model.gpt_neox.layers.10.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2552" name="self.model.gpt_neox.layers.10.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2553" name="__module.model.gpt_neox.layers.10.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2554" name="Constant_325300" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2431148164" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2555" name="__module.model.gpt_neox.layers.10.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1940,input.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2556" name="__module.model.gpt_neox.layers.10/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1942,1944,hidden_states.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2557" name="__module.model.gpt_neox.layers.11.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2558" name="__module.model.gpt_neox.layers.11.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2559" name="Constant_325301" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2431164548" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2560" name="__module.model.gpt_neox.layers.11.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2561" name="Constant_325302" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2431180932" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2562" name="__module.model.gpt_neox.layers.11.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1954"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2563" name="self.model.gpt_neox.layers.11.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="2431197316" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2564" name="Convert_449339" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2565" name="self.model.gpt_neox.layers.11.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="2481528964" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2566" name="Convert_449342" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2567" name="self.model.gpt_neox.layers.11.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2568" name="self.model.gpt_neox.layers.11.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="2481541252" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2569" name="self.model.gpt_neox.layers.11.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2570" name="self.model.gpt_neox.layers.11.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2571" name="__module.model.gpt_neox.layers.11.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2572" name="Constant_325303" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="2481565828" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2573" name="__module.model.gpt_neox.layers.11.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1961,qkv.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2574" name="__module.model.gpt_neox.layers.11.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2575" name="__module.model.gpt_neox.layers.11.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1965,qkv.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="2576" name="Constant_298244" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2577" name="Constant_298247" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2578" name="Constant_298250" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2579" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1966"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2580" name="Constant_6613" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1967"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2581" name="__module.model.gpt_neox.layers.11.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1968,query.67"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2582" name="Constant_298256" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2583" name="Constant_298259" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2584" name="Constant_298262" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2585" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1975,q.23"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2586" name="self.model.gpt_neox.layers.11.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.11.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2587" name="__module.model.gpt_neox.layers.11.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2588" name="Constant_298268" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2589" name="Constant_298271" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2590" name="Constant_298274" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2591" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1969"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2592" name="ShapeOf_338910" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2593" name="Constant_341003" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2594" name="Constant_338912" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2595" name="Gather_338913" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1979"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2596" name="Constant_432924" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2597" name="Constant_432917" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2598" name="Constant_432919" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2599" name="Constant_432921" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2600" name="Concat_432922" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2601" name="Broadcast_432925" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2602" name="ReadValue_417294" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.11.keypresent.11.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.11.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2603" name="Constant_401956" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2604" name="Gather_401957" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2605" name="ShapeOf_338915" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2606" name="Constant_338916" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2607" name="Constant_338917" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2608" name="Gather_338918" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1981" /> + </output> + </layer> + <layer id="2609" name="Constant_337694" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2610" name="Reshape_340927" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2611" name="__module.model.gpt_neox.layers.11.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1980,1984,1985,seq_len.45"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2612" name="__module.model.gpt_neox.layers.11.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2613" name="__module.model.gpt_neox.layers.11.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1988,1991,cos.45"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2614" name="Constant_38293" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2615" name="__module.model.gpt_neox.layers.11.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1994"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2616" name="__module.model.gpt_neox.layers.11.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1995,cos.47"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2617" name="__module.model.gpt_neox.layers.11.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1999"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2618" name="Constant_298279" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2619" name="Constant_298278" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2620" name="__module.model.gpt_neox.layers.11.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2621" name="__module.model.gpt_neox.layers.11.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2622" name="__module.model.gpt_neox.layers.11.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2000,2005" /> + </output> + </layer> + <layer id="2623" name="__module.model.gpt_neox.layers.11.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2624" name="__module.model.gpt_neox.layers.11.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2002,2003,2007,2008" /> + </output> + </layer> + <layer id="2625" name="Constant_337696" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2626" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2627" name="Constant_298277" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2628" name="ScatterUpdate_298280" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2629" name="Constant_298283" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2630" name="Constant_298286" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2631" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2009,x2.45"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2632" name="Constant_325304" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2633" name="__module.model.gpt_neox.layers.11.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2010"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2634" name="Constant_298331" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2635" name="Constant_298336" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2636" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2004"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2637" name="__module.model.gpt_neox.layers.11.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2012"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2638" name="self.model.gpt_neox.layers.11.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.11.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2639" name="__module.model.gpt_neox.layers.11.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2640" name="__module.model.gpt_neox.layers.11.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2641" name="__module.model.gpt_neox.layers.11.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1989,1992,sin.45"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2642" name="Constant_38296" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2643" name="__module.model.gpt_neox.layers.11.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="1997"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2644" name="__module.model.gpt_neox.layers.11.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1998,sin.47"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2645" name="__module.model.gpt_neox.layers.11.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2013"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2646" name="__module.model.gpt_neox.layers.11.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2014,2032,2042,query.69,query.71"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2647" name="Constant_6627" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1970"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2648" name="__module.model.gpt_neox.layers.11.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1971,key.67"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2649" name="Constant_298382" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2650" name="Constant_298385" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2651" name="Constant_298388" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2652" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1977,k.23"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2653" name="__module.model.gpt_neox.layers.11.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2015"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2654" name="Constant_298392" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2655" name="Constant_298391" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2656" name="__module.model.gpt_neox.layers.11.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2657" name="__module.model.gpt_neox.layers.11.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2658" name="__module.model.gpt_neox.layers.11.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2016,2021" /> + </output> + </layer> + <layer id="2659" name="__module.model.gpt_neox.layers.11.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2660" name="__module.model.gpt_neox.layers.11.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2018,2019,2023,2024" /> + </output> + </layer> + <layer id="2661" name="Constant_337698" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2662" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2663" name="Constant_298390" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2664" name="ScatterUpdate_298393" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2665" name="Constant_298396" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2666" name="Constant_298399" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2667" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2025,x2.47"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2668" name="Constant_325305" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2669" name="__module.model.gpt_neox.layers.11.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2026"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2670" name="Constant_298444" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2671" name="Constant_298449" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2672" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2020"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2673" name="__module.model.gpt_neox.layers.11.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2028"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2674" name="__module.model.gpt_neox.layers.11.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2029"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2675" name="__module.model.gpt_neox.layers.11.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2030,2034"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2676" name="__module.model.gpt_neox.layers.11.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.11.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2677" name="Constant_432937" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2678" name="Constant_432930" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2679" name="Constant_432932" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2680" name="Constant_432934" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2681" name="Concat_432935" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2682" name="Broadcast_432938" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2683" name="ReadValue_417296" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.11.valuepresent.11.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.11.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2684" name="Constant_401959" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2685" name="Gather_401960" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2686" name="Constant_298494" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2687" name="Constant_298497" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2688" name="Constant_298500" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2689" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1972"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2690" name="Constant_6641" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="1973"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2691" name="__module.model.gpt_neox.layers.11.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1974"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2692" name="__module.model.gpt_neox.layers.11.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.11.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2693" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="2051"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2694" name="Constant_298504" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2695" name="Constant_298503" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2696" name="ShapeOf_338920" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2697" name="Constant_338921" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2698" name="Constant_338922" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2699" name="Gather_338923" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="2700" name="Add_338924" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2046" /> + </output> + </layer> + <layer id="2701" name="ShapeOf_338991" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2702" name="Constant_338992" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2703" name="Constant_338993" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2704" name="Gather_338994" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2044" /> + </output> + </layer> + <layer id="2705" name="__module.model.gpt_neox.layers.11.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2048,2049" /> + </output> + </layer> + <layer id="2706" name="Constant_337700" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2707" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2708" name="Constant_298502" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2709" name="ScatterUpdate_298505" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2710" name="Constant_298506" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2711" name="Constant_337702" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2712" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2713" name="ScatterUpdate_298507" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2714" name="Constant_298510" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2715" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2052"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2716" name="Constant_298583" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2717" name="Constant_298584" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2718" name="Constant_298580" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2719" name="Constant_298579" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2720" name="ScatterUpdate_298585" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2721" name="Constant_298588" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2722" name="__module.model.gpt_neox.layers.11.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2053,2054"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2723" name="__module.model.gpt_neox.layers.11.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2724" name="__module.model.gpt_neox.layers.11.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="2041" /> + </output> + </layer> + <layer id="2725" name="__module.model.gpt_neox.layers.11.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="2055,causal_mask.45"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2726" name="Add_315780" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2727" name="ShapeOf_315781" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2728" name="Constant_338997" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2729" name="Constant_338998" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2730" name="Gather_338999" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2039"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2731" name="Constant_268071" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2732" name="Constant_268073" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2733" name="Constant_268075" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2734" name="__module.model.gpt_neox.layers.11.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2056"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2735" name="Maximum_315782" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2736" name="__module.model.gpt_neox.layers.11.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2058"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2737" name="__module.model.gpt_neox.layers.11.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2059,2060,sdpa_result.23,tensor.45"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2738" name="Constant_7082" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2061"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2739" name="__module.model.gpt_neox.layers.11.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2062"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2740" name="__module.model.gpt_neox.layers.11.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2741" name="__module.model.gpt_neox.layers.11.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2067"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2742" name="self.model.gpt_neox.layers.11.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="2481614980" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2743" name="Convert_449350" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2744" name="self.model.gpt_neox.layers.11.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2498392196" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2745" name="Convert_449353" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2746" name="self.model.gpt_neox.layers.11.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2747" name="self.model.gpt_neox.layers.11.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2498396292" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2748" name="self.model.gpt_neox.layers.11.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2749" name="self.model.gpt_neox.layers.11.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2750" name="__module.model.gpt_neox.layers.11.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2751" name="Constant_325306" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2498404484" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2752" name="__module.model.gpt_neox.layers.11.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2070,2072,input.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2753" name="__module.model.gpt_neox.layers.11/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2076,attn_output.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2754" name="__module.model.gpt_neox.layers.11.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2755" name="__module.model.gpt_neox.layers.11.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2756" name="Constant_325307" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2498420868" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2757" name="__module.model.gpt_neox.layers.11.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2758" name="Constant_325308" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2498437252" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2759" name="__module.model.gpt_neox.layers.11.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2080"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2760" name="self.model.gpt_neox.layers.11.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="2498453636" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2761" name="Convert_449361" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2762" name="self.model.gpt_neox.layers.11.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="2565562500" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2763" name="Convert_449364" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2764" name="self.model.gpt_neox.layers.11.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2765" name="self.model.gpt_neox.layers.11.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="2565578884" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2766" name="self.model.gpt_neox.layers.11.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2767" name="self.model.gpt_neox.layers.11.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2768" name="__module.model.gpt_neox.layers.11.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2769" name="Constant_325309" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="2565611652" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2770" name="__module.model.gpt_neox.layers.11.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2085"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2771" name="__module.model.gpt_neox.layers.11.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2086"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2772" name="self.model.gpt_neox.layers.11.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="2565677188" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2773" name="Convert_449372" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2774" name="self.model.gpt_neox.layers.11.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2632786052" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2775" name="Convert_449375" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2776" name="self.model.gpt_neox.layers.11.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2777" name="self.model.gpt_neox.layers.11.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2632790148" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2778" name="self.model.gpt_neox.layers.11.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2779" name="self.model.gpt_neox.layers.11.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2780" name="__module.model.gpt_neox.layers.11.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2781" name="Constant_325310" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2632798340" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2782" name="__module.model.gpt_neox.layers.11.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2089,input.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2783" name="__module.model.gpt_neox.layers.11/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2091,2093,hidden_states.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2784" name="__module.model.gpt_neox.layers.12.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2785" name="__module.model.gpt_neox.layers.12.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2786" name="Constant_325311" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2632814724" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2787" name="__module.model.gpt_neox.layers.12.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2788" name="Constant_325312" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2632831108" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2789" name="__module.model.gpt_neox.layers.12.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2790" name="self.model.gpt_neox.layers.12.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="2632847492" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2791" name="Convert_449383" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2792" name="self.model.gpt_neox.layers.12.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="2683179140" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2793" name="Convert_449386" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2794" name="self.model.gpt_neox.layers.12.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2795" name="self.model.gpt_neox.layers.12.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="2683191428" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2796" name="self.model.gpt_neox.layers.12.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2797" name="self.model.gpt_neox.layers.12.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2798" name="__module.model.gpt_neox.layers.12.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2799" name="Constant_325313" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="2683216004" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2800" name="__module.model.gpt_neox.layers.12.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2110,qkv.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="2801" name="__module.model.gpt_neox.layers.12.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2802" name="__module.model.gpt_neox.layers.12.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2114,qkv.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="2803" name="Constant_298595" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2804" name="Constant_298598" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2805" name="Constant_298601" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2806" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2807" name="Constant_7194" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2116"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2808" name="__module.model.gpt_neox.layers.12.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2117,query.73"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2809" name="Constant_298607" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2810" name="Constant_298610" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2811" name="Constant_298613" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2812" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2124,q.25"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2813" name="self.model.gpt_neox.layers.12.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.12.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2814" name="__module.model.gpt_neox.layers.12.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2815" name="Constant_298619" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2816" name="Constant_298622" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2817" name="Constant_298625" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2818" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2118"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2819" name="ShapeOf_339001" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2820" name="Constant_341006" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2821" name="Constant_339003" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2822" name="Gather_339004" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2128"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2823" name="Constant_432950" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2824" name="Constant_432943" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2825" name="Constant_432945" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2826" name="Constant_432947" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2827" name="Concat_432948" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2828" name="Broadcast_432951" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2829" name="ReadValue_417298" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.12.keypresent.12.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.12.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2830" name="Constant_401962" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2831" name="Gather_401963" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2832" name="ShapeOf_339006" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2833" name="Constant_339007" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2834" name="Constant_339008" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2835" name="Gather_339009" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2130" /> + </output> + </layer> + <layer id="2836" name="Constant_337704" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2837" name="Reshape_340929" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2838" name="__module.model.gpt_neox.layers.12.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2129,2133,2134,seq_len.49"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2839" name="__module.model.gpt_neox.layers.12.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2840" name="__module.model.gpt_neox.layers.12.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2137,2140,cos.49"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2841" name="Constant_38299" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2842" name="__module.model.gpt_neox.layers.12.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2143"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2843" name="__module.model.gpt_neox.layers.12.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2144,cos.51"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2844" name="__module.model.gpt_neox.layers.12.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2148"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2845" name="Constant_298630" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2846" name="Constant_298629" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2847" name="__module.model.gpt_neox.layers.12.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2848" name="__module.model.gpt_neox.layers.12.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2849" name="__module.model.gpt_neox.layers.12.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2149,2154" /> + </output> + </layer> + <layer id="2850" name="__module.model.gpt_neox.layers.12.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2851" name="__module.model.gpt_neox.layers.12.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2151,2152,2156,2157" /> + </output> + </layer> + <layer id="2852" name="Constant_337706" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2853" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2854" name="Constant_298628" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2855" name="ScatterUpdate_298631" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2856" name="Constant_298634" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2857" name="Constant_298637" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2858" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2158,x2.49"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2859" name="Constant_325314" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2860" name="__module.model.gpt_neox.layers.12.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2159"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2861" name="Constant_298682" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2862" name="Constant_298687" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2863" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2153"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2864" name="__module.model.gpt_neox.layers.12.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2161"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2865" name="self.model.gpt_neox.layers.12.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.12.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2866" name="__module.model.gpt_neox.layers.12.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2867" name="__module.model.gpt_neox.layers.12.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2868" name="__module.model.gpt_neox.layers.12.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2138,2141,sin.49"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2869" name="Constant_38302" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2870" name="__module.model.gpt_neox.layers.12.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2146"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2871" name="__module.model.gpt_neox.layers.12.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2147,sin.51"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2872" name="__module.model.gpt_neox.layers.12.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2162"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2873" name="__module.model.gpt_neox.layers.12.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2163,2181,2191,query.75,query.77"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2874" name="Constant_7208" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2119"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2875" name="__module.model.gpt_neox.layers.12.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2120,key.73"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2876" name="Constant_298733" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2877" name="Constant_298736" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2878" name="Constant_298739" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2879" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2126,k.25"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2880" name="__module.model.gpt_neox.layers.12.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2164"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2881" name="Constant_298743" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2882" name="Constant_298742" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2883" name="__module.model.gpt_neox.layers.12.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2884" name="__module.model.gpt_neox.layers.12.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2885" name="__module.model.gpt_neox.layers.12.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2165,2170" /> + </output> + </layer> + <layer id="2886" name="__module.model.gpt_neox.layers.12.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2887" name="__module.model.gpt_neox.layers.12.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2167,2168,2172,2173" /> + </output> + </layer> + <layer id="2888" name="Constant_337708" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2889" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2890" name="Constant_298741" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2891" name="ScatterUpdate_298744" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2892" name="Constant_298747" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2893" name="Constant_298750" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2894" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2174,x2.51"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2895" name="Constant_325315" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2896" name="__module.model.gpt_neox.layers.12.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2175"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2897" name="Constant_298795" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2898" name="Constant_298800" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2899" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2169"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2900" name="__module.model.gpt_neox.layers.12.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2177"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2901" name="__module.model.gpt_neox.layers.12.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2178"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2902" name="__module.model.gpt_neox.layers.12.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2179,2183"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2903" name="__module.model.gpt_neox.layers.12.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.12.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2904" name="Constant_432963" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2905" name="Constant_432956" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2906" name="Constant_432958" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2907" name="Constant_432960" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2908" name="Concat_432961" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2909" name="Broadcast_432964" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2910" name="ReadValue_417300" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.12.valuepresent.12.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.12.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2911" name="Constant_401965" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2912" name="Gather_401966" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2913" name="Constant_298845" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2914" name="Constant_298848" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2915" name="Constant_298851" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2916" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2121"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2917" name="Constant_7222" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2122"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2918" name="__module.model.gpt_neox.layers.12.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2123"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2919" name="__module.model.gpt_neox.layers.12.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.12.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2920" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="2200"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2921" name="Constant_298855" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2922" name="Constant_298854" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2923" name="ShapeOf_339011" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2924" name="Constant_339012" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2925" name="Constant_339013" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2926" name="Gather_339014" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="2927" name="Add_339015" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2195" /> + </output> + </layer> + <layer id="2928" name="ShapeOf_339082" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2929" name="Constant_339083" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2930" name="Constant_339084" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2931" name="Gather_339085" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2193" /> + </output> + </layer> + <layer id="2932" name="__module.model.gpt_neox.layers.12.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2197,2198" /> + </output> + </layer> + <layer id="2933" name="Constant_337710" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2934" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2935" name="Constant_298853" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2936" name="ScatterUpdate_298856" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2937" name="Constant_298857" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2938" name="Constant_337712" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2939" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2940" name="ScatterUpdate_298858" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2941" name="Constant_298861" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2942" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2201"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="2943" name="Constant_298934" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2944" name="Constant_298935" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2945" name="Constant_298931" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2946" name="Constant_298930" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2947" name="ScatterUpdate_298936" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2948" name="Constant_298939" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2949" name="__module.model.gpt_neox.layers.12.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2202,2203"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2950" name="__module.model.gpt_neox.layers.12.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2951" name="__module.model.gpt_neox.layers.12.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="2190" /> + </output> + </layer> + <layer id="2952" name="__module.model.gpt_neox.layers.12.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="2204,causal_mask.49"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2953" name="Add_315852" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2954" name="ShapeOf_315853" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2955" name="Constant_339088" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2956" name="Constant_339089" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2957" name="Gather_339090" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2188"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2958" name="Constant_268081" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2959" name="Constant_268083" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2960" name="Constant_268085" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2961" name="__module.model.gpt_neox.layers.12.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2205"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2962" name="Maximum_315854" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2963" name="__module.model.gpt_neox.layers.12.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2207"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2964" name="__module.model.gpt_neox.layers.12.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2208,2209,sdpa_result.25,tensor.49"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2965" name="Constant_7663" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2210"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2966" name="__module.model.gpt_neox.layers.12.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2211"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2967" name="__module.model.gpt_neox.layers.12.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2968" name="__module.model.gpt_neox.layers.12.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2216"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2969" name="self.model.gpt_neox.layers.12.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="2683265156" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2970" name="Convert_449394" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2971" name="self.model.gpt_neox.layers.12.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2700042372" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2972" name="Convert_449397" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2973" name="self.model.gpt_neox.layers.12.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2974" name="self.model.gpt_neox.layers.12.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2700046468" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2975" name="self.model.gpt_neox.layers.12.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2976" name="self.model.gpt_neox.layers.12.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2977" name="__module.model.gpt_neox.layers.12.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2978" name="Constant_325316" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2700054660" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2979" name="__module.model.gpt_neox.layers.12.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2219,2221,input.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2980" name="__module.model.gpt_neox.layers.12/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2225,attn_output.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2981" name="__module.model.gpt_neox.layers.12.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2982" name="__module.model.gpt_neox.layers.12.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2983" name="Constant_325317" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2700071044" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2984" name="__module.model.gpt_neox.layers.12.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2985" name="Constant_325318" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2700087428" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2986" name="__module.model.gpt_neox.layers.12.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2229"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2987" name="self.model.gpt_neox.layers.12.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="2700103812" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2988" name="Convert_449405" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2989" name="self.model.gpt_neox.layers.12.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="2767212676" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2990" name="Convert_449408" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2991" name="self.model.gpt_neox.layers.12.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2992" name="self.model.gpt_neox.layers.12.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="2767229060" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2993" name="self.model.gpt_neox.layers.12.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2994" name="self.model.gpt_neox.layers.12.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="2995" name="__module.model.gpt_neox.layers.12.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2996" name="Constant_325319" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="2767261828" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2997" name="__module.model.gpt_neox.layers.12.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2234"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2998" name="__module.model.gpt_neox.layers.12.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2235"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="2999" name="self.model.gpt_neox.layers.12.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="2767327364" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3000" name="Convert_449416" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3001" name="self.model.gpt_neox.layers.12.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2834436228" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3002" name="Convert_449419" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3003" name="self.model.gpt_neox.layers.12.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3004" name="self.model.gpt_neox.layers.12.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2834440324" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3005" name="self.model.gpt_neox.layers.12.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3006" name="self.model.gpt_neox.layers.12.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3007" name="__module.model.gpt_neox.layers.12.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3008" name="Constant_325320" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2834448516" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3009" name="__module.model.gpt_neox.layers.12.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2238,input.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3010" name="__module.model.gpt_neox.layers.12/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2240,2242,hidden_states.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3011" name="__module.model.gpt_neox.layers.13.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3012" name="__module.model.gpt_neox.layers.13.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3013" name="Constant_325321" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2834464900" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3014" name="__module.model.gpt_neox.layers.13.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3015" name="Constant_325322" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2834481284" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3016" name="__module.model.gpt_neox.layers.13.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2252"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3017" name="self.model.gpt_neox.layers.13.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="2834497668" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3018" name="Convert_449427" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3019" name="self.model.gpt_neox.layers.13.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="2884829316" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3020" name="Convert_449430" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3021" name="self.model.gpt_neox.layers.13.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3022" name="self.model.gpt_neox.layers.13.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="2884841604" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3023" name="self.model.gpt_neox.layers.13.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3024" name="self.model.gpt_neox.layers.13.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3025" name="__module.model.gpt_neox.layers.13.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3026" name="Constant_325323" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="2884866180" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3027" name="__module.model.gpt_neox.layers.13.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2259,qkv.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3028" name="__module.model.gpt_neox.layers.13.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3029" name="__module.model.gpt_neox.layers.13.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2263,qkv.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="3030" name="Constant_298946" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3031" name="Constant_298949" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3032" name="Constant_298952" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3033" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2264"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3034" name="Constant_7775" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2265"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3035" name="__module.model.gpt_neox.layers.13.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2266,query.79"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3036" name="Constant_298958" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3037" name="Constant_298961" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3038" name="Constant_298964" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3039" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2273,q.27"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3040" name="self.model.gpt_neox.layers.13.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.13.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3041" name="__module.model.gpt_neox.layers.13.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3042" name="Constant_298970" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3043" name="Constant_298973" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3044" name="Constant_298976" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3045" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2267"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3046" name="ShapeOf_339092" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3047" name="Constant_341009" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3048" name="Constant_339094" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3049" name="Gather_339095" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2277"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3050" name="Constant_432976" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3051" name="Constant_432969" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3052" name="Constant_432971" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3053" name="Constant_432973" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3054" name="Concat_432974" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3055" name="Broadcast_432977" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3056" name="ReadValue_417302" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.13.keypresent.13.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.13.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3057" name="Constant_401968" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3058" name="Gather_401969" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3059" name="ShapeOf_339097" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3060" name="Constant_339098" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3061" name="Constant_339099" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3062" name="Gather_339100" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2279" /> + </output> + </layer> + <layer id="3063" name="Constant_337714" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3064" name="Reshape_340931" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3065" name="__module.model.gpt_neox.layers.13.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2278,2282,2283,seq_len.53"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3066" name="__module.model.gpt_neox.layers.13.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3067" name="__module.model.gpt_neox.layers.13.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2286,2289,cos.53"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3068" name="Constant_38305" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3069" name="__module.model.gpt_neox.layers.13.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2292"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3070" name="__module.model.gpt_neox.layers.13.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2293,cos.55"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3071" name="__module.model.gpt_neox.layers.13.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2297"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3072" name="Constant_298981" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3073" name="Constant_298980" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3074" name="__module.model.gpt_neox.layers.13.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3075" name="__module.model.gpt_neox.layers.13.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3076" name="__module.model.gpt_neox.layers.13.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2298,2303" /> + </output> + </layer> + <layer id="3077" name="__module.model.gpt_neox.layers.13.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3078" name="__module.model.gpt_neox.layers.13.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2300,2301,2305,2306" /> + </output> + </layer> + <layer id="3079" name="Constant_337716" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3080" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3081" name="Constant_298979" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3082" name="ScatterUpdate_298982" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3083" name="Constant_298985" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3084" name="Constant_298988" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3085" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2307,x2.53"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3086" name="Constant_325324" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3087" name="__module.model.gpt_neox.layers.13.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2308"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3088" name="Constant_299033" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3089" name="Constant_299038" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3090" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2302"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3091" name="__module.model.gpt_neox.layers.13.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2310"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3092" name="self.model.gpt_neox.layers.13.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.13.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3093" name="__module.model.gpt_neox.layers.13.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3094" name="__module.model.gpt_neox.layers.13.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3095" name="__module.model.gpt_neox.layers.13.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2287,2290,sin.53"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3096" name="Constant_38308" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3097" name="__module.model.gpt_neox.layers.13.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2295"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3098" name="__module.model.gpt_neox.layers.13.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2296,sin.55"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3099" name="__module.model.gpt_neox.layers.13.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2311"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3100" name="__module.model.gpt_neox.layers.13.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2312,2330,2340,query.81,query.83"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3101" name="Constant_7789" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2268"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3102" name="__module.model.gpt_neox.layers.13.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2269,key.79"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3103" name="Constant_299084" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3104" name="Constant_299087" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3105" name="Constant_299090" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3106" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2275,k.27"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3107" name="__module.model.gpt_neox.layers.13.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2313"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3108" name="Constant_299094" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3109" name="Constant_299093" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3110" name="__module.model.gpt_neox.layers.13.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3111" name="__module.model.gpt_neox.layers.13.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3112" name="__module.model.gpt_neox.layers.13.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2314,2319" /> + </output> + </layer> + <layer id="3113" name="__module.model.gpt_neox.layers.13.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3114" name="__module.model.gpt_neox.layers.13.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2316,2317,2321,2322" /> + </output> + </layer> + <layer id="3115" name="Constant_337718" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3116" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3117" name="Constant_299092" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3118" name="ScatterUpdate_299095" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3119" name="Constant_299098" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3120" name="Constant_299101" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3121" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2323,x2.55"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3122" name="Constant_325325" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3123" name="__module.model.gpt_neox.layers.13.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2324"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3124" name="Constant_299146" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3125" name="Constant_299151" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3126" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2318"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3127" name="__module.model.gpt_neox.layers.13.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2326"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3128" name="__module.model.gpt_neox.layers.13.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2327"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3129" name="__module.model.gpt_neox.layers.13.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2328,2332"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3130" name="__module.model.gpt_neox.layers.13.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.13.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3131" name="Constant_432989" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3132" name="Constant_432982" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3133" name="Constant_432984" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3134" name="Constant_432986" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3135" name="Concat_432987" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3136" name="Broadcast_432990" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3137" name="ReadValue_417304" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.13.valuepresent.13.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.13.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3138" name="Constant_401971" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3139" name="Gather_401972" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3140" name="Constant_299196" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3141" name="Constant_299199" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3142" name="Constant_299202" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3143" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2270"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3144" name="Constant_7803" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2271"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3145" name="__module.model.gpt_neox.layers.13.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2272"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3146" name="__module.model.gpt_neox.layers.13.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.13.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3147" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="2349"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3148" name="Constant_299206" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3149" name="Constant_299205" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3150" name="ShapeOf_339102" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3151" name="Constant_339103" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3152" name="Constant_339104" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3153" name="Gather_339105" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="3154" name="Add_339106" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2344" /> + </output> + </layer> + <layer id="3155" name="ShapeOf_339173" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3156" name="Constant_339174" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3157" name="Constant_339175" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3158" name="Gather_339176" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2342" /> + </output> + </layer> + <layer id="3159" name="__module.model.gpt_neox.layers.13.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2346,2347" /> + </output> + </layer> + <layer id="3160" name="Constant_337720" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3161" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3162" name="Constant_299204" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3163" name="ScatterUpdate_299207" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3164" name="Constant_299208" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3165" name="Constant_337722" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3166" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3167" name="ScatterUpdate_299209" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3168" name="Constant_299212" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3169" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2350"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3170" name="Constant_299285" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3171" name="Constant_299286" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3172" name="Constant_299282" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3173" name="Constant_299281" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3174" name="ScatterUpdate_299287" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3175" name="Constant_299290" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3176" name="__module.model.gpt_neox.layers.13.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2351,2352"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3177" name="__module.model.gpt_neox.layers.13.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3178" name="__module.model.gpt_neox.layers.13.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="2339" /> + </output> + </layer> + <layer id="3179" name="__module.model.gpt_neox.layers.13.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="2353,causal_mask.53"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3180" name="Add_315924" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3181" name="ShapeOf_315925" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3182" name="Constant_339179" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3183" name="Constant_339180" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3184" name="Gather_339181" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2337"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3185" name="Constant_268091" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3186" name="Constant_268093" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3187" name="Constant_268095" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3188" name="__module.model.gpt_neox.layers.13.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2354"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3189" name="Maximum_315926" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3190" name="__module.model.gpt_neox.layers.13.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2356"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3191" name="__module.model.gpt_neox.layers.13.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2357,2358,sdpa_result.27,tensor.53"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3192" name="Constant_8244" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2359"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3193" name="__module.model.gpt_neox.layers.13.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2360"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3194" name="__module.model.gpt_neox.layers.13.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3195" name="__module.model.gpt_neox.layers.13.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2365"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3196" name="self.model.gpt_neox.layers.13.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="2884915332" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3197" name="Convert_449438" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3198" name="self.model.gpt_neox.layers.13.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="2901692548" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3199" name="Convert_449441" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3200" name="self.model.gpt_neox.layers.13.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3201" name="self.model.gpt_neox.layers.13.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="2901696644" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3202" name="self.model.gpt_neox.layers.13.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3203" name="self.model.gpt_neox.layers.13.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3204" name="__module.model.gpt_neox.layers.13.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3205" name="Constant_325326" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2901704836" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3206" name="__module.model.gpt_neox.layers.13.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2368,2370,input.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3207" name="__module.model.gpt_neox.layers.13/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2374,attn_output.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3208" name="__module.model.gpt_neox.layers.13.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3209" name="__module.model.gpt_neox.layers.13.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3210" name="Constant_325327" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2901721220" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3211" name="__module.model.gpt_neox.layers.13.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3212" name="Constant_325328" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="2901737604" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3213" name="__module.model.gpt_neox.layers.13.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2378"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3214" name="self.model.gpt_neox.layers.13.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="2901753988" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3215" name="Convert_449449" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3216" name="self.model.gpt_neox.layers.13.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="2968862852" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3217" name="Convert_449452" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3218" name="self.model.gpt_neox.layers.13.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3219" name="self.model.gpt_neox.layers.13.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="2968879236" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3220" name="self.model.gpt_neox.layers.13.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3221" name="self.model.gpt_neox.layers.13.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3222" name="__module.model.gpt_neox.layers.13.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3223" name="Constant_325329" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="2968912004" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3224" name="__module.model.gpt_neox.layers.13.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2383"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3225" name="__module.model.gpt_neox.layers.13.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2384"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3226" name="self.model.gpt_neox.layers.13.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="2968977540" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3227" name="Convert_449460" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3228" name="self.model.gpt_neox.layers.13.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3036086404" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3229" name="Convert_449463" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3230" name="self.model.gpt_neox.layers.13.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3231" name="self.model.gpt_neox.layers.13.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3036090500" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3232" name="self.model.gpt_neox.layers.13.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3233" name="self.model.gpt_neox.layers.13.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3234" name="__module.model.gpt_neox.layers.13.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3235" name="Constant_325330" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3036098692" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3236" name="__module.model.gpt_neox.layers.13.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2387,input.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3237" name="__module.model.gpt_neox.layers.13/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2389,2391,hidden_states.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3238" name="__module.model.gpt_neox.layers.14.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3239" name="__module.model.gpt_neox.layers.14.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3240" name="Constant_325331" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3036115076" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3241" name="__module.model.gpt_neox.layers.14.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3242" name="Constant_325332" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3036131460" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3243" name="__module.model.gpt_neox.layers.14.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2401"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3244" name="self.model.gpt_neox.layers.14.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="3036147844" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3245" name="Convert_449471" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3246" name="self.model.gpt_neox.layers.14.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="3086479492" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3247" name="Convert_449474" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3248" name="self.model.gpt_neox.layers.14.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3249" name="self.model.gpt_neox.layers.14.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="3086491780" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3250" name="self.model.gpt_neox.layers.14.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3251" name="self.model.gpt_neox.layers.14.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3252" name="__module.model.gpt_neox.layers.14.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3253" name="Constant_325333" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="3086516356" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3254" name="__module.model.gpt_neox.layers.14.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2408,qkv.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3255" name="__module.model.gpt_neox.layers.14.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3256" name="__module.model.gpt_neox.layers.14.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2412,qkv.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="3257" name="Constant_299297" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3258" name="Constant_299300" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3259" name="Constant_299303" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3260" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2413"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3261" name="Constant_8356" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2414"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3262" name="__module.model.gpt_neox.layers.14.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2415,query.85"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3263" name="Constant_299309" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3264" name="Constant_299312" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3265" name="Constant_299315" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3266" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2422,q.29"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3267" name="self.model.gpt_neox.layers.14.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.14.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3268" name="__module.model.gpt_neox.layers.14.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3269" name="Constant_299321" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3270" name="Constant_299324" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3271" name="Constant_299327" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3272" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2416"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3273" name="ShapeOf_339183" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3274" name="Constant_341012" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3275" name="Constant_339185" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3276" name="Gather_339186" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2426"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3277" name="Constant_433002" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3278" name="Constant_432995" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3279" name="Constant_432997" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3280" name="Constant_432999" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3281" name="Concat_433000" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3282" name="Broadcast_433003" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3283" name="ReadValue_417306" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.14.keypresent.14.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.14.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3284" name="Constant_401974" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3285" name="Gather_401975" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3286" name="ShapeOf_339188" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3287" name="Constant_339189" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3288" name="Constant_339190" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3289" name="Gather_339191" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2428" /> + </output> + </layer> + <layer id="3290" name="Constant_337724" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3291" name="Reshape_340933" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3292" name="__module.model.gpt_neox.layers.14.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2427,2431,2432,seq_len.57"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3293" name="__module.model.gpt_neox.layers.14.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3294" name="__module.model.gpt_neox.layers.14.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2435,2438,cos.57"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3295" name="Constant_38311" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3296" name="__module.model.gpt_neox.layers.14.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2441"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3297" name="__module.model.gpt_neox.layers.14.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2442,cos.59"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3298" name="__module.model.gpt_neox.layers.14.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2446"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3299" name="Constant_299332" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3300" name="Constant_299331" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3301" name="__module.model.gpt_neox.layers.14.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3302" name="__module.model.gpt_neox.layers.14.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3303" name="__module.model.gpt_neox.layers.14.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2447,2452" /> + </output> + </layer> + <layer id="3304" name="__module.model.gpt_neox.layers.14.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3305" name="__module.model.gpt_neox.layers.14.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2449,2450,2454,2455" /> + </output> + </layer> + <layer id="3306" name="Constant_337726" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3307" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3308" name="Constant_299330" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3309" name="ScatterUpdate_299333" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3310" name="Constant_299336" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3311" name="Constant_299339" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3312" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2456,x2.57"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3313" name="Constant_325334" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3314" name="__module.model.gpt_neox.layers.14.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2457"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3315" name="Constant_299384" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3316" name="Constant_299389" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3317" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2451"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3318" name="__module.model.gpt_neox.layers.14.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2459"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3319" name="self.model.gpt_neox.layers.14.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.14.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3320" name="__module.model.gpt_neox.layers.14.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3321" name="__module.model.gpt_neox.layers.14.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3322" name="__module.model.gpt_neox.layers.14.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2436,2439,sin.57"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3323" name="Constant_38314" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3324" name="__module.model.gpt_neox.layers.14.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2444"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3325" name="__module.model.gpt_neox.layers.14.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2445,sin.59"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3326" name="__module.model.gpt_neox.layers.14.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2460"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3327" name="__module.model.gpt_neox.layers.14.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2461,2479,2489,query.87,query.89"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3328" name="Constant_8370" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2417"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3329" name="__module.model.gpt_neox.layers.14.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2418,key.85"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3330" name="Constant_299435" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3331" name="Constant_299438" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3332" name="Constant_299441" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3333" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2424,k.29"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3334" name="__module.model.gpt_neox.layers.14.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2462"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3335" name="Constant_299445" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3336" name="Constant_299444" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3337" name="__module.model.gpt_neox.layers.14.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3338" name="__module.model.gpt_neox.layers.14.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3339" name="__module.model.gpt_neox.layers.14.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2463,2468" /> + </output> + </layer> + <layer id="3340" name="__module.model.gpt_neox.layers.14.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3341" name="__module.model.gpt_neox.layers.14.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2465,2466,2470,2471" /> + </output> + </layer> + <layer id="3342" name="Constant_337728" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3343" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3344" name="Constant_299443" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3345" name="ScatterUpdate_299446" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3346" name="Constant_299449" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3347" name="Constant_299452" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3348" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2472,x2.59"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3349" name="Constant_325335" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3350" name="__module.model.gpt_neox.layers.14.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2473"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3351" name="Constant_299497" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3352" name="Constant_299502" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3353" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2467"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3354" name="__module.model.gpt_neox.layers.14.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2475"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3355" name="__module.model.gpt_neox.layers.14.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2476"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3356" name="__module.model.gpt_neox.layers.14.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2477,2481"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3357" name="__module.model.gpt_neox.layers.14.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.14.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3358" name="Constant_433015" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3359" name="Constant_433008" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3360" name="Constant_433010" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3361" name="Constant_433012" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3362" name="Concat_433013" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3363" name="Broadcast_433016" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3364" name="ReadValue_417308" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.14.valuepresent.14.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.14.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3365" name="Constant_401977" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3366" name="Gather_401978" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3367" name="Constant_299547" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3368" name="Constant_299550" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3369" name="Constant_299553" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3370" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2419"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3371" name="Constant_8384" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2420"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3372" name="__module.model.gpt_neox.layers.14.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2421"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3373" name="__module.model.gpt_neox.layers.14.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.14.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3374" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="2498"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3375" name="Constant_299557" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3376" name="Constant_299556" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3377" name="ShapeOf_339193" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3378" name="Constant_339194" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3379" name="Constant_339195" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3380" name="Gather_339196" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="3381" name="Add_339197" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2493" /> + </output> + </layer> + <layer id="3382" name="ShapeOf_339264" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3383" name="Constant_339265" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3384" name="Constant_339266" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3385" name="Gather_339267" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2491" /> + </output> + </layer> + <layer id="3386" name="__module.model.gpt_neox.layers.14.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2495,2496" /> + </output> + </layer> + <layer id="3387" name="Constant_337730" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3388" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3389" name="Constant_299555" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3390" name="ScatterUpdate_299558" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3391" name="Constant_299559" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3392" name="Constant_337732" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3393" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3394" name="ScatterUpdate_299560" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3395" name="Constant_299563" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3396" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2499"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3397" name="Constant_299636" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3398" name="Constant_299637" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3399" name="Constant_299633" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3400" name="Constant_299632" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3401" name="ScatterUpdate_299638" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3402" name="Constant_299641" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3403" name="__module.model.gpt_neox.layers.14.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2500,2501"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3404" name="__module.model.gpt_neox.layers.14.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3405" name="__module.model.gpt_neox.layers.14.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="2488" /> + </output> + </layer> + <layer id="3406" name="__module.model.gpt_neox.layers.14.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="2502,causal_mask.57"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3407" name="Add_315996" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3408" name="ShapeOf_315997" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3409" name="Constant_339270" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3410" name="Constant_339271" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3411" name="Gather_339272" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2486"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3412" name="Constant_268101" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3413" name="Constant_268103" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3414" name="Constant_268105" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3415" name="__module.model.gpt_neox.layers.14.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2503"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3416" name="Maximum_315998" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3417" name="__module.model.gpt_neox.layers.14.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2505"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3418" name="__module.model.gpt_neox.layers.14.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2506,2507,sdpa_result.29,tensor.57"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3419" name="Constant_8825" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2508"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3420" name="__module.model.gpt_neox.layers.14.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2509"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3421" name="__module.model.gpt_neox.layers.14.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3422" name="__module.model.gpt_neox.layers.14.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2514"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3423" name="self.model.gpt_neox.layers.14.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="3086565508" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3424" name="Convert_449482" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3425" name="self.model.gpt_neox.layers.14.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3103342724" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3426" name="Convert_449485" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3427" name="self.model.gpt_neox.layers.14.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3428" name="self.model.gpt_neox.layers.14.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3103346820" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3429" name="self.model.gpt_neox.layers.14.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3430" name="self.model.gpt_neox.layers.14.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3431" name="__module.model.gpt_neox.layers.14.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3432" name="Constant_325336" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3103355012" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3433" name="__module.model.gpt_neox.layers.14.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2517,2519,input.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3434" name="__module.model.gpt_neox.layers.14/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2523,attn_output.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3435" name="__module.model.gpt_neox.layers.14.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3436" name="__module.model.gpt_neox.layers.14.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3437" name="Constant_325337" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3103371396" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3438" name="__module.model.gpt_neox.layers.14.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3439" name="Constant_325338" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3103387780" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3440" name="__module.model.gpt_neox.layers.14.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2527"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3441" name="self.model.gpt_neox.layers.14.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="3103404164" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3442" name="Convert_449493" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3443" name="self.model.gpt_neox.layers.14.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="3170513028" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3444" name="Convert_449496" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3445" name="self.model.gpt_neox.layers.14.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3446" name="self.model.gpt_neox.layers.14.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="3170529412" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3447" name="self.model.gpt_neox.layers.14.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3448" name="self.model.gpt_neox.layers.14.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3449" name="__module.model.gpt_neox.layers.14.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3450" name="Constant_325339" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="3170562180" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3451" name="__module.model.gpt_neox.layers.14.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2532"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3452" name="__module.model.gpt_neox.layers.14.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2533"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3453" name="self.model.gpt_neox.layers.14.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="3170627716" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3454" name="Convert_449504" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3455" name="self.model.gpt_neox.layers.14.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3237736580" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3456" name="Convert_449507" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3457" name="self.model.gpt_neox.layers.14.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3458" name="self.model.gpt_neox.layers.14.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3237740676" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3459" name="self.model.gpt_neox.layers.14.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3460" name="self.model.gpt_neox.layers.14.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3461" name="__module.model.gpt_neox.layers.14.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3462" name="Constant_325340" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3237748868" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3463" name="__module.model.gpt_neox.layers.14.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2536,input.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3464" name="__module.model.gpt_neox.layers.14/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2538,2540,hidden_states.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3465" name="__module.model.gpt_neox.layers.15.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3466" name="__module.model.gpt_neox.layers.15.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3467" name="Constant_325341" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3237765252" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3468" name="__module.model.gpt_neox.layers.15.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3469" name="Constant_325342" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3237781636" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3470" name="__module.model.gpt_neox.layers.15.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2550"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3471" name="self.model.gpt_neox.layers.15.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="3237798020" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3472" name="Convert_449515" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3473" name="self.model.gpt_neox.layers.15.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="3288129668" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3474" name="Convert_449518" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3475" name="self.model.gpt_neox.layers.15.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3476" name="self.model.gpt_neox.layers.15.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="3288141956" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3477" name="self.model.gpt_neox.layers.15.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3478" name="self.model.gpt_neox.layers.15.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3479" name="__module.model.gpt_neox.layers.15.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3480" name="Constant_325343" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="3288166532" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3481" name="__module.model.gpt_neox.layers.15.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2557,qkv.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3482" name="__module.model.gpt_neox.layers.15.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3483" name="__module.model.gpt_neox.layers.15.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2561,qkv.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="3484" name="Constant_299648" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3485" name="Constant_299651" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3486" name="Constant_299654" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3487" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2562"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3488" name="Constant_8937" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2563"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3489" name="__module.model.gpt_neox.layers.15.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2564,query.91"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3490" name="Constant_299660" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3491" name="Constant_299663" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3492" name="Constant_299666" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3493" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2571,q.31"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3494" name="self.model.gpt_neox.layers.15.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.15.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3495" name="__module.model.gpt_neox.layers.15.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3496" name="Constant_299672" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3497" name="Constant_299675" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3498" name="Constant_299678" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3499" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2565"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3500" name="ShapeOf_339274" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3501" name="Constant_341015" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3502" name="Constant_339276" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3503" name="Gather_339277" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2575"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3504" name="Constant_433028" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3505" name="Constant_433021" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3506" name="Constant_433023" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3507" name="Constant_433025" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3508" name="Concat_433026" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3509" name="Broadcast_433029" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3510" name="ReadValue_417310" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.15.keypresent.15.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.15.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3511" name="Constant_401980" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3512" name="Gather_401981" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3513" name="ShapeOf_339279" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3514" name="Constant_339280" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3515" name="Constant_339281" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3516" name="Gather_339282" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2577" /> + </output> + </layer> + <layer id="3517" name="Constant_337734" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3518" name="Reshape_340935" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3519" name="__module.model.gpt_neox.layers.15.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2576,2580,2581,seq_len.61"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3520" name="__module.model.gpt_neox.layers.15.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3521" name="__module.model.gpt_neox.layers.15.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2584,2587,cos.61"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3522" name="Constant_38317" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3523" name="__module.model.gpt_neox.layers.15.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2590"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3524" name="__module.model.gpt_neox.layers.15.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2591,cos.63"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3525" name="__module.model.gpt_neox.layers.15.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2595"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3526" name="Constant_299683" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3527" name="Constant_299682" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3528" name="__module.model.gpt_neox.layers.15.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3529" name="__module.model.gpt_neox.layers.15.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3530" name="__module.model.gpt_neox.layers.15.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2596,2601" /> + </output> + </layer> + <layer id="3531" name="__module.model.gpt_neox.layers.15.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3532" name="__module.model.gpt_neox.layers.15.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2598,2599,2603,2604" /> + </output> + </layer> + <layer id="3533" name="Constant_337736" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3534" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3535" name="Constant_299681" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3536" name="ScatterUpdate_299684" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3537" name="Constant_299687" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3538" name="Constant_299690" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3539" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2605,x2.61"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3540" name="Constant_325344" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3541" name="__module.model.gpt_neox.layers.15.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2606"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3542" name="Constant_299735" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3543" name="Constant_299740" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3544" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2600"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3545" name="__module.model.gpt_neox.layers.15.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2608"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3546" name="self.model.gpt_neox.layers.15.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.15.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3547" name="__module.model.gpt_neox.layers.15.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3548" name="__module.model.gpt_neox.layers.15.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3549" name="__module.model.gpt_neox.layers.15.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2585,2588,sin.61"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3550" name="Constant_38320" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3551" name="__module.model.gpt_neox.layers.15.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2593"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3552" name="__module.model.gpt_neox.layers.15.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2594,sin.63"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3553" name="__module.model.gpt_neox.layers.15.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2609"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3554" name="__module.model.gpt_neox.layers.15.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2610,2628,2638,query.93,query.95"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3555" name="Constant_8951" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2566"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3556" name="__module.model.gpt_neox.layers.15.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2567,key.91"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3557" name="Constant_299786" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3558" name="Constant_299789" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3559" name="Constant_299792" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3560" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2573,k.31"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3561" name="__module.model.gpt_neox.layers.15.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2611"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3562" name="Constant_299796" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3563" name="Constant_299795" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3564" name="__module.model.gpt_neox.layers.15.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3565" name="__module.model.gpt_neox.layers.15.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3566" name="__module.model.gpt_neox.layers.15.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2612,2617" /> + </output> + </layer> + <layer id="3567" name="__module.model.gpt_neox.layers.15.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3568" name="__module.model.gpt_neox.layers.15.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2614,2615,2619,2620" /> + </output> + </layer> + <layer id="3569" name="Constant_337738" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3570" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3571" name="Constant_299794" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3572" name="ScatterUpdate_299797" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3573" name="Constant_299800" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3574" name="Constant_299803" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3575" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2621,x2.63"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3576" name="Constant_325345" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3577" name="__module.model.gpt_neox.layers.15.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2622"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3578" name="Constant_299848" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3579" name="Constant_299853" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3580" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2616"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3581" name="__module.model.gpt_neox.layers.15.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2624"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3582" name="__module.model.gpt_neox.layers.15.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2625"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3583" name="__module.model.gpt_neox.layers.15.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2626,2630"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3584" name="__module.model.gpt_neox.layers.15.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.15.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3585" name="Constant_433041" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3586" name="Constant_433034" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3587" name="Constant_433036" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3588" name="Constant_433038" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3589" name="Concat_433039" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3590" name="Broadcast_433042" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3591" name="ReadValue_417312" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.15.valuepresent.15.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.15.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3592" name="Constant_401983" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3593" name="Gather_401984" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3594" name="Constant_299898" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3595" name="Constant_299901" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3596" name="Constant_299904" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3597" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2568"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3598" name="Constant_8965" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2569"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3599" name="__module.model.gpt_neox.layers.15.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2570"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3600" name="__module.model.gpt_neox.layers.15.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.15.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3601" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="2647"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3602" name="Constant_299908" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3603" name="Constant_299907" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3604" name="ShapeOf_339284" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3605" name="Constant_339285" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3606" name="Constant_339286" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3607" name="Gather_339287" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="3608" name="Add_339288" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2642" /> + </output> + </layer> + <layer id="3609" name="ShapeOf_339355" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3610" name="Constant_339356" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3611" name="Constant_339357" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3612" name="Gather_339358" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2640" /> + </output> + </layer> + <layer id="3613" name="__module.model.gpt_neox.layers.15.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2644,2645" /> + </output> + </layer> + <layer id="3614" name="Constant_337740" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3615" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3616" name="Constant_299906" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3617" name="ScatterUpdate_299909" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3618" name="Constant_299910" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3619" name="Constant_337742" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3620" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3621" name="ScatterUpdate_299911" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3622" name="Constant_299914" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3623" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2648"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3624" name="Constant_299987" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3625" name="Constant_299988" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3626" name="Constant_299984" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3627" name="Constant_299983" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3628" name="ScatterUpdate_299989" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3629" name="Constant_299992" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3630" name="__module.model.gpt_neox.layers.15.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2649,2650"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3631" name="__module.model.gpt_neox.layers.15.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3632" name="__module.model.gpt_neox.layers.15.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="2637" /> + </output> + </layer> + <layer id="3633" name="__module.model.gpt_neox.layers.15.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="2651,causal_mask.61"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3634" name="Add_316068" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3635" name="ShapeOf_316069" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3636" name="Constant_339361" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3637" name="Constant_339362" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3638" name="Gather_339363" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2635"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3639" name="Constant_268111" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3640" name="Constant_268113" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3641" name="Constant_268115" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3642" name="__module.model.gpt_neox.layers.15.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2652"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3643" name="Maximum_316070" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3644" name="__module.model.gpt_neox.layers.15.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2654"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3645" name="__module.model.gpt_neox.layers.15.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2655,2656,sdpa_result.31,tensor.61"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3646" name="Constant_9406" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2657"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3647" name="__module.model.gpt_neox.layers.15.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2658"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3648" name="__module.model.gpt_neox.layers.15.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3649" name="__module.model.gpt_neox.layers.15.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2663"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3650" name="self.model.gpt_neox.layers.15.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="3288215684" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3651" name="Convert_449526" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3652" name="self.model.gpt_neox.layers.15.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3304992900" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3653" name="Convert_449529" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3654" name="self.model.gpt_neox.layers.15.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3655" name="self.model.gpt_neox.layers.15.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3304996996" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3656" name="self.model.gpt_neox.layers.15.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3657" name="self.model.gpt_neox.layers.15.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3658" name="__module.model.gpt_neox.layers.15.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3659" name="Constant_325346" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3305005188" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3660" name="__module.model.gpt_neox.layers.15.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2666,2668,input.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3661" name="__module.model.gpt_neox.layers.15/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2672,attn_output.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3662" name="__module.model.gpt_neox.layers.15.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3663" name="__module.model.gpt_neox.layers.15.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3664" name="Constant_325347" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3305021572" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3665" name="__module.model.gpt_neox.layers.15.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3666" name="Constant_325348" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3305037956" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3667" name="__module.model.gpt_neox.layers.15.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2676"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3668" name="self.model.gpt_neox.layers.15.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="3305054340" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3669" name="Convert_449537" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3670" name="self.model.gpt_neox.layers.15.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="3372163204" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3671" name="Convert_449540" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3672" name="self.model.gpt_neox.layers.15.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3673" name="self.model.gpt_neox.layers.15.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="3372179588" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3674" name="self.model.gpt_neox.layers.15.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3675" name="self.model.gpt_neox.layers.15.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3676" name="__module.model.gpt_neox.layers.15.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3677" name="Constant_325349" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="3372212356" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3678" name="__module.model.gpt_neox.layers.15.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2681"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3679" name="__module.model.gpt_neox.layers.15.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2682"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3680" name="self.model.gpt_neox.layers.15.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="3372277892" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3681" name="Convert_449548" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3682" name="self.model.gpt_neox.layers.15.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3439386756" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3683" name="Convert_449551" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3684" name="self.model.gpt_neox.layers.15.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3685" name="self.model.gpt_neox.layers.15.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3439390852" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3686" name="self.model.gpt_neox.layers.15.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3687" name="self.model.gpt_neox.layers.15.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3688" name="__module.model.gpt_neox.layers.15.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3689" name="Constant_325350" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3439399044" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3690" name="__module.model.gpt_neox.layers.15.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2685,input.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3691" name="__module.model.gpt_neox.layers.15/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2687,2689,hidden_states.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3692" name="__module.model.gpt_neox.layers.16.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3693" name="__module.model.gpt_neox.layers.16.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3694" name="Constant_325351" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3439415428" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3695" name="__module.model.gpt_neox.layers.16.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3696" name="Constant_325352" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3439431812" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3697" name="__module.model.gpt_neox.layers.16.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2699"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3698" name="self.model.gpt_neox.layers.16.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="3439448196" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3699" name="Convert_449559" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3700" name="self.model.gpt_neox.layers.16.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="3489779844" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3701" name="Convert_449562" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3702" name="self.model.gpt_neox.layers.16.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3703" name="self.model.gpt_neox.layers.16.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="3489792132" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3704" name="self.model.gpt_neox.layers.16.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3705" name="self.model.gpt_neox.layers.16.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3706" name="__module.model.gpt_neox.layers.16.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3707" name="Constant_325353" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="3489816708" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3708" name="__module.model.gpt_neox.layers.16.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2706,qkv.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3709" name="__module.model.gpt_neox.layers.16.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3710" name="__module.model.gpt_neox.layers.16.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2710,qkv.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="3711" name="Constant_299999" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3712" name="Constant_300002" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3713" name="Constant_300005" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3714" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2711"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3715" name="Constant_9518" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2712"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3716" name="__module.model.gpt_neox.layers.16.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2713,query.97"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3717" name="Constant_300011" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3718" name="Constant_300014" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3719" name="Constant_300017" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3720" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2720,q.33"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3721" name="self.model.gpt_neox.layers.16.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.16.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3722" name="__module.model.gpt_neox.layers.16.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3723" name="Constant_300023" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3724" name="Constant_300026" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3725" name="Constant_300029" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3726" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2714"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3727" name="ShapeOf_339365" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3728" name="Constant_341018" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3729" name="Constant_339367" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3730" name="Gather_339368" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2724"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3731" name="Constant_433054" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3732" name="Constant_433047" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3733" name="Constant_433049" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3734" name="Constant_433051" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3735" name="Concat_433052" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3736" name="Broadcast_433055" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3737" name="ReadValue_417314" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.16.keypresent.16.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.16.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3738" name="Constant_401986" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3739" name="Gather_401987" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3740" name="ShapeOf_339370" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3741" name="Constant_339371" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3742" name="Constant_339372" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3743" name="Gather_339373" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2726" /> + </output> + </layer> + <layer id="3744" name="Constant_337744" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3745" name="Reshape_340937" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3746" name="__module.model.gpt_neox.layers.16.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2725,2729,2730,seq_len.65"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3747" name="__module.model.gpt_neox.layers.16.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3748" name="__module.model.gpt_neox.layers.16.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2733,2736,cos.65"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3749" name="Constant_38323" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3750" name="__module.model.gpt_neox.layers.16.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2739"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3751" name="__module.model.gpt_neox.layers.16.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2740,cos.67"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3752" name="__module.model.gpt_neox.layers.16.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2744"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3753" name="Constant_300034" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3754" name="Constant_300033" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3755" name="__module.model.gpt_neox.layers.16.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3756" name="__module.model.gpt_neox.layers.16.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3757" name="__module.model.gpt_neox.layers.16.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2745,2750" /> + </output> + </layer> + <layer id="3758" name="__module.model.gpt_neox.layers.16.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3759" name="__module.model.gpt_neox.layers.16.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2747,2748,2752,2753" /> + </output> + </layer> + <layer id="3760" name="Constant_337746" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3761" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3762" name="Constant_300032" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3763" name="ScatterUpdate_300035" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3764" name="Constant_300038" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3765" name="Constant_300041" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3766" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2754,x2.65"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3767" name="Constant_325354" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3768" name="__module.model.gpt_neox.layers.16.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2755"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3769" name="Constant_300086" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3770" name="Constant_300091" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3771" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2749"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3772" name="__module.model.gpt_neox.layers.16.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2757"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3773" name="self.model.gpt_neox.layers.16.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.16.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3774" name="__module.model.gpt_neox.layers.16.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3775" name="__module.model.gpt_neox.layers.16.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3776" name="__module.model.gpt_neox.layers.16.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2734,2737,sin.65"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3777" name="Constant_38326" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3778" name="__module.model.gpt_neox.layers.16.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2742"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3779" name="__module.model.gpt_neox.layers.16.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2743,sin.67"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3780" name="__module.model.gpt_neox.layers.16.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2758"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3781" name="__module.model.gpt_neox.layers.16.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2759,2777,2787,query.101,query.99"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3782" name="Constant_9532" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2715"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3783" name="__module.model.gpt_neox.layers.16.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2716,key.97"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3784" name="Constant_300137" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3785" name="Constant_300140" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3786" name="Constant_300143" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3787" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2722,k.33"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3788" name="__module.model.gpt_neox.layers.16.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2760"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3789" name="Constant_300147" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3790" name="Constant_300146" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3791" name="__module.model.gpt_neox.layers.16.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3792" name="__module.model.gpt_neox.layers.16.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3793" name="__module.model.gpt_neox.layers.16.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2761,2766" /> + </output> + </layer> + <layer id="3794" name="__module.model.gpt_neox.layers.16.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3795" name="__module.model.gpt_neox.layers.16.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2763,2764,2768,2769" /> + </output> + </layer> + <layer id="3796" name="Constant_337748" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3797" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3798" name="Constant_300145" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3799" name="ScatterUpdate_300148" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3800" name="Constant_300151" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3801" name="Constant_300154" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3802" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2770,x2.67"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3803" name="Constant_325355" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3804" name="__module.model.gpt_neox.layers.16.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2771"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3805" name="Constant_300199" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3806" name="Constant_300204" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3807" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2765"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3808" name="__module.model.gpt_neox.layers.16.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2773"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3809" name="__module.model.gpt_neox.layers.16.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2774"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3810" name="__module.model.gpt_neox.layers.16.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2775,2779"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3811" name="__module.model.gpt_neox.layers.16.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.16.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3812" name="Constant_433067" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3813" name="Constant_433060" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3814" name="Constant_433062" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3815" name="Constant_433064" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3816" name="Concat_433065" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3817" name="Broadcast_433068" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3818" name="ReadValue_417316" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.16.valuepresent.16.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.16.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3819" name="Constant_401989" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3820" name="Gather_401990" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3821" name="Constant_300249" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3822" name="Constant_300252" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3823" name="Constant_300255" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3824" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2717"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3825" name="Constant_9546" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2718"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3826" name="__module.model.gpt_neox.layers.16.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2719"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3827" name="__module.model.gpt_neox.layers.16.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.16.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3828" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="2796"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3829" name="Constant_300259" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3830" name="Constant_300258" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3831" name="ShapeOf_339375" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3832" name="Constant_339376" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3833" name="Constant_339377" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3834" name="Gather_339378" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="3835" name="Add_339379" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2791" /> + </output> + </layer> + <layer id="3836" name="ShapeOf_339446" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3837" name="Constant_339447" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3838" name="Constant_339448" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3839" name="Gather_339449" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2789" /> + </output> + </layer> + <layer id="3840" name="__module.model.gpt_neox.layers.16.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2793,2794" /> + </output> + </layer> + <layer id="3841" name="Constant_337750" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3842" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3843" name="Constant_300257" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3844" name="ScatterUpdate_300260" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3845" name="Constant_300261" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3846" name="Constant_337752" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3847" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3848" name="ScatterUpdate_300262" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3849" name="Constant_300265" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3850" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2797"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="3851" name="Constant_300338" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3852" name="Constant_300339" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3853" name="Constant_300335" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3854" name="Constant_300334" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3855" name="ScatterUpdate_300340" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3856" name="Constant_300343" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3857" name="__module.model.gpt_neox.layers.16.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2798,2799"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3858" name="__module.model.gpt_neox.layers.16.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3859" name="__module.model.gpt_neox.layers.16.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="2786" /> + </output> + </layer> + <layer id="3860" name="__module.model.gpt_neox.layers.16.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="2800,causal_mask.65"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3861" name="Add_316140" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3862" name="ShapeOf_316141" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3863" name="Constant_339452" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3864" name="Constant_339453" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3865" name="Gather_339454" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2784"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3866" name="Constant_268121" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3867" name="Constant_268123" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3868" name="Constant_268125" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3869" name="__module.model.gpt_neox.layers.16.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2801"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3870" name="Maximum_316142" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3871" name="__module.model.gpt_neox.layers.16.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2803"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3872" name="__module.model.gpt_neox.layers.16.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2804,2805,sdpa_result.33,tensor.65"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3873" name="Constant_9987" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2806"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3874" name="__module.model.gpt_neox.layers.16.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2807"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3875" name="__module.model.gpt_neox.layers.16.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3876" name="__module.model.gpt_neox.layers.16.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2812"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3877" name="self.model.gpt_neox.layers.16.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="3489865860" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3878" name="Convert_449570" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3879" name="self.model.gpt_neox.layers.16.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3506643076" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3880" name="Convert_449573" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3881" name="self.model.gpt_neox.layers.16.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3882" name="self.model.gpt_neox.layers.16.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3506647172" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3883" name="self.model.gpt_neox.layers.16.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3884" name="self.model.gpt_neox.layers.16.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3885" name="__module.model.gpt_neox.layers.16.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3886" name="Constant_325356" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3506655364" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3887" name="__module.model.gpt_neox.layers.16.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2815,2817,input.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3888" name="__module.model.gpt_neox.layers.16/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2821,attn_output.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3889" name="__module.model.gpt_neox.layers.16.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3890" name="__module.model.gpt_neox.layers.16.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3891" name="Constant_325357" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3506671748" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3892" name="__module.model.gpt_neox.layers.16.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3893" name="Constant_325358" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3506688132" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3894" name="__module.model.gpt_neox.layers.16.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2825"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3895" name="self.model.gpt_neox.layers.16.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="3506704516" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3896" name="Convert_449581" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3897" name="self.model.gpt_neox.layers.16.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="3573813380" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3898" name="Convert_449584" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3899" name="self.model.gpt_neox.layers.16.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3900" name="self.model.gpt_neox.layers.16.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="3573829764" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3901" name="self.model.gpt_neox.layers.16.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3902" name="self.model.gpt_neox.layers.16.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3903" name="__module.model.gpt_neox.layers.16.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3904" name="Constant_325359" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="3573862532" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3905" name="__module.model.gpt_neox.layers.16.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2830"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3906" name="__module.model.gpt_neox.layers.16.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2831"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3907" name="self.model.gpt_neox.layers.16.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="3573928068" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3908" name="Convert_449592" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3909" name="self.model.gpt_neox.layers.16.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3641036932" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3910" name="Convert_449595" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3911" name="self.model.gpt_neox.layers.16.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3912" name="self.model.gpt_neox.layers.16.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3641041028" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3913" name="self.model.gpt_neox.layers.16.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3914" name="self.model.gpt_neox.layers.16.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="3915" name="__module.model.gpt_neox.layers.16.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3916" name="Constant_325360" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3641049220" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3917" name="__module.model.gpt_neox.layers.16.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2834,input.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3918" name="__module.model.gpt_neox.layers.16/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2836,2838,hidden_states.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3919" name="__module.model.gpt_neox.layers.17.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3920" name="__module.model.gpt_neox.layers.17.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3921" name="Constant_325361" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3641065604" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3922" name="__module.model.gpt_neox.layers.17.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3923" name="Constant_325362" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3641081988" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3924" name="__module.model.gpt_neox.layers.17.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2848"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3925" name="self.model.gpt_neox.layers.17.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="3641098372" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3926" name="Convert_449603" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3927" name="self.model.gpt_neox.layers.17.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="3691430020" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3928" name="Convert_449606" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3929" name="self.model.gpt_neox.layers.17.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3930" name="self.model.gpt_neox.layers.17.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="3691442308" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3931" name="self.model.gpt_neox.layers.17.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3932" name="self.model.gpt_neox.layers.17.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="3933" name="__module.model.gpt_neox.layers.17.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3934" name="Constant_325363" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="3691466884" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3935" name="__module.model.gpt_neox.layers.17.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2855,qkv.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="3936" name="__module.model.gpt_neox.layers.17.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3937" name="__module.model.gpt_neox.layers.17.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2859,qkv.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="3938" name="Constant_300350" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3939" name="Constant_300353" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3940" name="Constant_300356" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3941" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2860"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3942" name="Constant_10099" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2861"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3943" name="__module.model.gpt_neox.layers.17.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2862,query.103"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3944" name="Constant_300362" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3945" name="Constant_300365" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3946" name="Constant_300368" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3947" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2869,q.35"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3948" name="self.model.gpt_neox.layers.17.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.17.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3949" name="__module.model.gpt_neox.layers.17.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3950" name="Constant_300374" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3951" name="Constant_300377" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3952" name="Constant_300380" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3953" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2863"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3954" name="ShapeOf_339456" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3955" name="Constant_341021" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3956" name="Constant_339458" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3957" name="Gather_339459" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2873"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3958" name="Constant_433080" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3959" name="Constant_433073" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3960" name="Constant_433075" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3961" name="Constant_433077" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3962" name="Concat_433078" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3963" name="Broadcast_433081" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3964" name="ReadValue_417318" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.17.keypresent.17.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.17.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3965" name="Constant_401992" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3966" name="Gather_401993" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3967" name="ShapeOf_339461" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3968" name="Constant_339462" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3969" name="Constant_339463" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3970" name="Gather_339464" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2875" /> + </output> + </layer> + <layer id="3971" name="Constant_337754" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3972" name="Reshape_340939" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3973" name="__module.model.gpt_neox.layers.17.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2874,2878,2879,seq_len.69"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3974" name="__module.model.gpt_neox.layers.17.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3975" name="__module.model.gpt_neox.layers.17.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2882,2885,cos.69"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3976" name="Constant_38329" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3977" name="__module.model.gpt_neox.layers.17.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2888"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3978" name="__module.model.gpt_neox.layers.17.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2889,cos.71"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3979" name="__module.model.gpt_neox.layers.17.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2893"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3980" name="Constant_300385" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3981" name="Constant_300384" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3982" name="__module.model.gpt_neox.layers.17.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3983" name="__module.model.gpt_neox.layers.17.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3984" name="__module.model.gpt_neox.layers.17.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2894,2899" /> + </output> + </layer> + <layer id="3985" name="__module.model.gpt_neox.layers.17.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3986" name="__module.model.gpt_neox.layers.17.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2896,2897,2901,2902" /> + </output> + </layer> + <layer id="3987" name="Constant_337756" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3988" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3989" name="Constant_300383" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3990" name="ScatterUpdate_300386" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3991" name="Constant_300389" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3992" name="Constant_300392" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3993" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2903,x2.69"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3994" name="Constant_325364" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3995" name="__module.model.gpt_neox.layers.17.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2904"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3996" name="Constant_300437" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3997" name="Constant_300442" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3998" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2898"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3999" name="__module.model.gpt_neox.layers.17.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2906"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4000" name="self.model.gpt_neox.layers.17.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.17.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4001" name="__module.model.gpt_neox.layers.17.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4002" name="__module.model.gpt_neox.layers.17.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4003" name="__module.model.gpt_neox.layers.17.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2883,2886,sin.69"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4004" name="Constant_38332" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4005" name="__module.model.gpt_neox.layers.17.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="2891"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4006" name="__module.model.gpt_neox.layers.17.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2892,sin.71"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4007" name="__module.model.gpt_neox.layers.17.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2907"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4008" name="__module.model.gpt_neox.layers.17.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2908,2926,2936,query.105,query.107"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4009" name="Constant_10113" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2864"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4010" name="__module.model.gpt_neox.layers.17.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2865,key.103"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4011" name="Constant_300488" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4012" name="Constant_300491" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4013" name="Constant_300494" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4014" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2871,k.35"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4015" name="__module.model.gpt_neox.layers.17.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2909"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4016" name="Constant_300498" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4017" name="Constant_300497" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4018" name="__module.model.gpt_neox.layers.17.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4019" name="__module.model.gpt_neox.layers.17.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4020" name="__module.model.gpt_neox.layers.17.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2910,2915" /> + </output> + </layer> + <layer id="4021" name="__module.model.gpt_neox.layers.17.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4022" name="__module.model.gpt_neox.layers.17.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2912,2913,2917,2918" /> + </output> + </layer> + <layer id="4023" name="Constant_337758" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4024" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4025" name="Constant_300496" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4026" name="ScatterUpdate_300499" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4027" name="Constant_300502" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4028" name="Constant_300505" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4029" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2919,x2.71"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4030" name="Constant_325365" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4031" name="__module.model.gpt_neox.layers.17.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2920"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4032" name="Constant_300550" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4033" name="Constant_300555" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4034" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2914"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4035" name="__module.model.gpt_neox.layers.17.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2922"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4036" name="__module.model.gpt_neox.layers.17.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2923"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4037" name="__module.model.gpt_neox.layers.17.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2924,2928"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4038" name="__module.model.gpt_neox.layers.17.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.17.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4039" name="Constant_433093" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4040" name="Constant_433086" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4041" name="Constant_433088" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4042" name="Constant_433090" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4043" name="Concat_433091" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4044" name="Broadcast_433094" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4045" name="ReadValue_417320" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.17.valuepresent.17.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.17.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4046" name="Constant_401995" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4047" name="Gather_401996" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4048" name="Constant_300600" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4049" name="Constant_300603" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4050" name="Constant_300606" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4051" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2866"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4052" name="Constant_10127" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2867"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4053" name="__module.model.gpt_neox.layers.17.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2868"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4054" name="__module.model.gpt_neox.layers.17.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.17.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4055" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="2945"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4056" name="Constant_300610" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4057" name="Constant_300609" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4058" name="ShapeOf_339466" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4059" name="Constant_339467" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4060" name="Constant_339468" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4061" name="Gather_339469" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="4062" name="Add_339470" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2940" /> + </output> + </layer> + <layer id="4063" name="ShapeOf_339537" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4064" name="Constant_339538" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4065" name="Constant_339539" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4066" name="Gather_339540" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2938" /> + </output> + </layer> + <layer id="4067" name="__module.model.gpt_neox.layers.17.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="2942,2943" /> + </output> + </layer> + <layer id="4068" name="Constant_337760" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4069" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4070" name="Constant_300608" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4071" name="ScatterUpdate_300611" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4072" name="Constant_300612" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4073" name="Constant_337762" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4074" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4075" name="ScatterUpdate_300613" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4076" name="Constant_300616" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4077" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2946"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4078" name="Constant_300689" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4079" name="Constant_300690" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4080" name="Constant_300686" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4081" name="Constant_300685" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4082" name="ScatterUpdate_300691" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4083" name="Constant_300694" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4084" name="__module.model.gpt_neox.layers.17.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="2947,2948"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4085" name="__module.model.gpt_neox.layers.17.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4086" name="__module.model.gpt_neox.layers.17.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="2935" /> + </output> + </layer> + <layer id="4087" name="__module.model.gpt_neox.layers.17.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="2949,causal_mask.69"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4088" name="Add_316212" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4089" name="ShapeOf_316213" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4090" name="Constant_339543" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4091" name="Constant_339544" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4092" name="Gather_339545" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="2933"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4093" name="Constant_268131" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4094" name="Constant_268133" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4095" name="Constant_268135" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4096" name="__module.model.gpt_neox.layers.17.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2950"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4097" name="Maximum_316214" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4098" name="__module.model.gpt_neox.layers.17.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2952"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4099" name="__module.model.gpt_neox.layers.17.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2953,2954,sdpa_result.35,tensor.69"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4100" name="Constant_10568" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="2955"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4101" name="__module.model.gpt_neox.layers.17.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2956"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4102" name="__module.model.gpt_neox.layers.17.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4103" name="__module.model.gpt_neox.layers.17.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2961"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4104" name="self.model.gpt_neox.layers.17.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="3691516036" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4105" name="Convert_449614" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4106" name="self.model.gpt_neox.layers.17.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3708293252" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4107" name="Convert_449617" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4108" name="self.model.gpt_neox.layers.17.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4109" name="self.model.gpt_neox.layers.17.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3708297348" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4110" name="self.model.gpt_neox.layers.17.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4111" name="self.model.gpt_neox.layers.17.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4112" name="__module.model.gpt_neox.layers.17.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4113" name="Constant_325366" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3708305540" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4114" name="__module.model.gpt_neox.layers.17.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2964,2966,input.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4115" name="__module.model.gpt_neox.layers.17/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2970,attn_output.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4116" name="__module.model.gpt_neox.layers.17.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4117" name="__module.model.gpt_neox.layers.17.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4118" name="Constant_325367" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3708321924" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4119" name="__module.model.gpt_neox.layers.17.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4120" name="Constant_325368" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3708338308" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4121" name="__module.model.gpt_neox.layers.17.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2974"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4122" name="self.model.gpt_neox.layers.17.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="3708354692" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4123" name="Convert_449625" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4124" name="self.model.gpt_neox.layers.17.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="3775463556" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4125" name="Convert_449628" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4126" name="self.model.gpt_neox.layers.17.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4127" name="self.model.gpt_neox.layers.17.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="3775479940" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4128" name="self.model.gpt_neox.layers.17.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4129" name="self.model.gpt_neox.layers.17.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4130" name="__module.model.gpt_neox.layers.17.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4131" name="Constant_325369" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="3775512708" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4132" name="__module.model.gpt_neox.layers.17.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2979"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4133" name="__module.model.gpt_neox.layers.17.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2980"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4134" name="self.model.gpt_neox.layers.17.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="3775578244" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4135" name="Convert_449636" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4136" name="self.model.gpt_neox.layers.17.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3842687108" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4137" name="Convert_449639" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4138" name="self.model.gpt_neox.layers.17.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4139" name="self.model.gpt_neox.layers.17.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3842691204" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4140" name="self.model.gpt_neox.layers.17.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4141" name="self.model.gpt_neox.layers.17.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4142" name="__module.model.gpt_neox.layers.17.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4143" name="Constant_325370" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3842699396" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4144" name="__module.model.gpt_neox.layers.17.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2983,input.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4145" name="__module.model.gpt_neox.layers.17/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2985,2987,hidden_states.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4146" name="__module.model.gpt_neox.layers.18.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4147" name="__module.model.gpt_neox.layers.18.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4148" name="Constant_325371" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3842715780" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4149" name="__module.model.gpt_neox.layers.18.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4150" name="Constant_325372" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3842732164" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4151" name="__module.model.gpt_neox.layers.18.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2997"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4152" name="self.model.gpt_neox.layers.18.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="3842748548" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4153" name="Convert_449647" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4154" name="self.model.gpt_neox.layers.18.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="3893080196" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4155" name="Convert_449650" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4156" name="self.model.gpt_neox.layers.18.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4157" name="self.model.gpt_neox.layers.18.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="3893092484" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4158" name="self.model.gpt_neox.layers.18.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4159" name="self.model.gpt_neox.layers.18.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4160" name="__module.model.gpt_neox.layers.18.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4161" name="Constant_325373" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="3893117060" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4162" name="__module.model.gpt_neox.layers.18.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3004,qkv.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4163" name="__module.model.gpt_neox.layers.18.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4164" name="__module.model.gpt_neox.layers.18.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3008,qkv.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="4165" name="Constant_300701" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4166" name="Constant_300704" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4167" name="Constant_300707" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4168" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3009"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4169" name="Constant_10680" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3010"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4170" name="__module.model.gpt_neox.layers.18.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3011,query.109"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4171" name="Constant_300713" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4172" name="Constant_300716" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4173" name="Constant_300719" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4174" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3018,q.37"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4175" name="self.model.gpt_neox.layers.18.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.18.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4176" name="__module.model.gpt_neox.layers.18.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4177" name="Constant_300725" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4178" name="Constant_300728" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4179" name="Constant_300731" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4180" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3012"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4181" name="ShapeOf_339547" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4182" name="Constant_341024" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4183" name="Constant_339549" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4184" name="Gather_339550" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3022"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4185" name="Constant_433106" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4186" name="Constant_433099" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4187" name="Constant_433101" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4188" name="Constant_433103" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4189" name="Concat_433104" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4190" name="Broadcast_433107" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4191" name="ReadValue_417322" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.18.keypresent.18.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.18.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4192" name="Constant_401998" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4193" name="Gather_401999" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4194" name="ShapeOf_339552" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4195" name="Constant_339553" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4196" name="Constant_339554" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4197" name="Gather_339555" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3024" /> + </output> + </layer> + <layer id="4198" name="Constant_337764" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4199" name="Reshape_340941" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4200" name="__module.model.gpt_neox.layers.18.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3023,3027,3028,seq_len.73"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4201" name="__module.model.gpt_neox.layers.18.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4202" name="__module.model.gpt_neox.layers.18.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3031,3034,cos.73"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4203" name="Constant_38335" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4204" name="__module.model.gpt_neox.layers.18.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3037"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4205" name="__module.model.gpt_neox.layers.18.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3038,cos.75"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4206" name="__module.model.gpt_neox.layers.18.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3042"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4207" name="Constant_300736" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4208" name="Constant_300735" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4209" name="__module.model.gpt_neox.layers.18.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4210" name="__module.model.gpt_neox.layers.18.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4211" name="__module.model.gpt_neox.layers.18.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3043,3048" /> + </output> + </layer> + <layer id="4212" name="__module.model.gpt_neox.layers.18.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4213" name="__module.model.gpt_neox.layers.18.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3045,3046,3050,3051" /> + </output> + </layer> + <layer id="4214" name="Constant_337766" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4215" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4216" name="Constant_300734" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4217" name="ScatterUpdate_300737" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4218" name="Constant_300740" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4219" name="Constant_300743" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4220" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3052,x2.73"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4221" name="Constant_325374" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4222" name="__module.model.gpt_neox.layers.18.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3053"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4223" name="Constant_300788" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4224" name="Constant_300793" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4225" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3047"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4226" name="__module.model.gpt_neox.layers.18.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3055"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4227" name="self.model.gpt_neox.layers.18.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.18.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4228" name="__module.model.gpt_neox.layers.18.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4229" name="__module.model.gpt_neox.layers.18.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4230" name="__module.model.gpt_neox.layers.18.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3032,3035,sin.73"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4231" name="Constant_38338" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4232" name="__module.model.gpt_neox.layers.18.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3040"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4233" name="__module.model.gpt_neox.layers.18.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3041,sin.75"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4234" name="__module.model.gpt_neox.layers.18.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3056"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4235" name="__module.model.gpt_neox.layers.18.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3057,3075,3085,query.111,query.113"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4236" name="Constant_10694" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3013"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4237" name="__module.model.gpt_neox.layers.18.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3014,key.109"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4238" name="Constant_300839" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4239" name="Constant_300842" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4240" name="Constant_300845" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4241" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3020,k.37"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4242" name="__module.model.gpt_neox.layers.18.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3058"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4243" name="Constant_300849" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4244" name="Constant_300848" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4245" name="__module.model.gpt_neox.layers.18.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4246" name="__module.model.gpt_neox.layers.18.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4247" name="__module.model.gpt_neox.layers.18.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3059,3064" /> + </output> + </layer> + <layer id="4248" name="__module.model.gpt_neox.layers.18.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4249" name="__module.model.gpt_neox.layers.18.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3061,3062,3066,3067" /> + </output> + </layer> + <layer id="4250" name="Constant_337768" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4251" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4252" name="Constant_300847" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4253" name="ScatterUpdate_300850" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4254" name="Constant_300853" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4255" name="Constant_300856" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4256" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3068,x2.75"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4257" name="Constant_325375" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4258" name="__module.model.gpt_neox.layers.18.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3069"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4259" name="Constant_300901" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4260" name="Constant_300906" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4261" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3063"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4262" name="__module.model.gpt_neox.layers.18.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3071"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4263" name="__module.model.gpt_neox.layers.18.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3072"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4264" name="__module.model.gpt_neox.layers.18.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3073,3077"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4265" name="__module.model.gpt_neox.layers.18.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.18.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4266" name="Constant_433119" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4267" name="Constant_433112" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4268" name="Constant_433114" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4269" name="Constant_433116" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4270" name="Concat_433117" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4271" name="Broadcast_433120" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4272" name="ReadValue_417324" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.18.valuepresent.18.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.18.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4273" name="Constant_402001" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4274" name="Gather_402002" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4275" name="Constant_300951" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4276" name="Constant_300954" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4277" name="Constant_300957" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4278" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3015"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4279" name="Constant_10708" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3016"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4280" name="__module.model.gpt_neox.layers.18.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3017"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4281" name="__module.model.gpt_neox.layers.18.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.18.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4282" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="3094"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4283" name="Constant_300961" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4284" name="Constant_300960" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4285" name="ShapeOf_339557" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4286" name="Constant_339558" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4287" name="Constant_339559" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4288" name="Gather_339560" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="4289" name="Add_339561" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3089" /> + </output> + </layer> + <layer id="4290" name="ShapeOf_339628" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4291" name="Constant_339629" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4292" name="Constant_339630" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4293" name="Gather_339631" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3087" /> + </output> + </layer> + <layer id="4294" name="__module.model.gpt_neox.layers.18.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3091,3092" /> + </output> + </layer> + <layer id="4295" name="Constant_337770" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4296" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4297" name="Constant_300959" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4298" name="ScatterUpdate_300962" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4299" name="Constant_300963" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4300" name="Constant_337772" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4301" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4302" name="ScatterUpdate_300964" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4303" name="Constant_300967" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4304" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3095"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4305" name="Constant_301040" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4306" name="Constant_301041" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4307" name="Constant_301037" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4308" name="Constant_301036" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4309" name="ScatterUpdate_301042" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4310" name="Constant_301045" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4311" name="__module.model.gpt_neox.layers.18.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3096,3097"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4312" name="__module.model.gpt_neox.layers.18.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4313" name="__module.model.gpt_neox.layers.18.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="3084" /> + </output> + </layer> + <layer id="4314" name="__module.model.gpt_neox.layers.18.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="3098,causal_mask.73"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4315" name="Add_316284" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4316" name="ShapeOf_316285" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4317" name="Constant_339634" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4318" name="Constant_339635" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4319" name="Gather_339636" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3082"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4320" name="Constant_268141" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4321" name="Constant_268143" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4322" name="Constant_268145" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4323" name="__module.model.gpt_neox.layers.18.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3099"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4324" name="Maximum_316286" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4325" name="__module.model.gpt_neox.layers.18.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3101"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4326" name="__module.model.gpt_neox.layers.18.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3102,3103,sdpa_result.37,tensor.73"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4327" name="Constant_11149" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3104"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4328" name="__module.model.gpt_neox.layers.18.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3105"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4329" name="__module.model.gpt_neox.layers.18.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4330" name="__module.model.gpt_neox.layers.18.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3110"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4331" name="self.model.gpt_neox.layers.18.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="3893166212" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4332" name="Convert_449658" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4333" name="self.model.gpt_neox.layers.18.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="3909943428" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4334" name="Convert_449661" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4335" name="self.model.gpt_neox.layers.18.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4336" name="self.model.gpt_neox.layers.18.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="3909947524" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4337" name="self.model.gpt_neox.layers.18.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4338" name="self.model.gpt_neox.layers.18.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4339" name="__module.model.gpt_neox.layers.18.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4340" name="Constant_325376" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3909955716" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4341" name="__module.model.gpt_neox.layers.18.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3113,3115,input.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4342" name="__module.model.gpt_neox.layers.18/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3119,attn_output.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4343" name="__module.model.gpt_neox.layers.18.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4344" name="__module.model.gpt_neox.layers.18.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4345" name="Constant_325377" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3909972100" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4346" name="__module.model.gpt_neox.layers.18.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4347" name="Constant_325378" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="3909988484" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4348" name="__module.model.gpt_neox.layers.18.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3123"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4349" name="self.model.gpt_neox.layers.18.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="3910004868" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4350" name="Convert_449669" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4351" name="self.model.gpt_neox.layers.18.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="3977113732" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4352" name="Convert_449672" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4353" name="self.model.gpt_neox.layers.18.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4354" name="self.model.gpt_neox.layers.18.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="3977130116" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4355" name="self.model.gpt_neox.layers.18.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4356" name="self.model.gpt_neox.layers.18.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4357" name="__module.model.gpt_neox.layers.18.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4358" name="Constant_325379" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="3977162884" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4359" name="__module.model.gpt_neox.layers.18.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3128"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4360" name="__module.model.gpt_neox.layers.18.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3129"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4361" name="self.model.gpt_neox.layers.18.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="3977228420" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4362" name="Convert_449680" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4363" name="self.model.gpt_neox.layers.18.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4044337284" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4364" name="Convert_449683" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4365" name="self.model.gpt_neox.layers.18.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4366" name="self.model.gpt_neox.layers.18.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4044341380" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4367" name="self.model.gpt_neox.layers.18.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4368" name="self.model.gpt_neox.layers.18.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4369" name="__module.model.gpt_neox.layers.18.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4370" name="Constant_325380" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4044349572" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4371" name="__module.model.gpt_neox.layers.18.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3132,input.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4372" name="__module.model.gpt_neox.layers.18/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3134,3136,hidden_states.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4373" name="__module.model.gpt_neox.layers.19.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4374" name="__module.model.gpt_neox.layers.19.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4375" name="Constant_325381" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4044365956" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4376" name="__module.model.gpt_neox.layers.19.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4377" name="Constant_325382" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4044382340" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4378" name="__module.model.gpt_neox.layers.19.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3146"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4379" name="self.model.gpt_neox.layers.19.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="4044398724" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4380" name="Convert_449691" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4381" name="self.model.gpt_neox.layers.19.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="4094730372" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4382" name="Convert_449694" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4383" name="self.model.gpt_neox.layers.19.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4384" name="self.model.gpt_neox.layers.19.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="4094742660" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4385" name="self.model.gpt_neox.layers.19.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4386" name="self.model.gpt_neox.layers.19.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4387" name="__module.model.gpt_neox.layers.19.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4388" name="Constant_325383" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="4094767236" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4389" name="__module.model.gpt_neox.layers.19.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3153,qkv.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4390" name="__module.model.gpt_neox.layers.19.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4391" name="__module.model.gpt_neox.layers.19.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3157,qkv.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="4392" name="Constant_301052" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4393" name="Constant_301055" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4394" name="Constant_301058" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4395" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3158"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4396" name="Constant_11261" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3159"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4397" name="__module.model.gpt_neox.layers.19.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3160,query.115"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4398" name="Constant_301064" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4399" name="Constant_301067" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4400" name="Constant_301070" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4401" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3167,q.39"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4402" name="self.model.gpt_neox.layers.19.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.19.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4403" name="__module.model.gpt_neox.layers.19.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4404" name="Constant_301076" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4405" name="Constant_301079" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4406" name="Constant_301082" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4407" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3161"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4408" name="ShapeOf_339638" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4409" name="Constant_341027" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4410" name="Constant_339640" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4411" name="Gather_339641" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3171"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4412" name="Constant_433132" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4413" name="Constant_433125" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4414" name="Constant_433127" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4415" name="Constant_433129" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4416" name="Concat_433130" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4417" name="Broadcast_433133" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4418" name="ReadValue_417326" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.19.keypresent.19.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.19.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4419" name="Constant_402004" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4420" name="Gather_402005" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4421" name="ShapeOf_339643" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4422" name="Constant_339644" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4423" name="Constant_339645" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4424" name="Gather_339646" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3173" /> + </output> + </layer> + <layer id="4425" name="Constant_337774" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4426" name="Reshape_340943" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4427" name="__module.model.gpt_neox.layers.19.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3172,3176,3177,seq_len.77"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4428" name="__module.model.gpt_neox.layers.19.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4429" name="__module.model.gpt_neox.layers.19.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3180,3183,cos.77"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4430" name="Constant_38341" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4431" name="__module.model.gpt_neox.layers.19.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3186"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4432" name="__module.model.gpt_neox.layers.19.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3187,cos.79"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4433" name="__module.model.gpt_neox.layers.19.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3191"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4434" name="Constant_301087" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4435" name="Constant_301086" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4436" name="__module.model.gpt_neox.layers.19.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4437" name="__module.model.gpt_neox.layers.19.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4438" name="__module.model.gpt_neox.layers.19.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3192,3197" /> + </output> + </layer> + <layer id="4439" name="__module.model.gpt_neox.layers.19.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4440" name="__module.model.gpt_neox.layers.19.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3194,3195,3199,3200" /> + </output> + </layer> + <layer id="4441" name="Constant_337776" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4442" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4443" name="Constant_301085" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4444" name="ScatterUpdate_301088" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4445" name="Constant_301091" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4446" name="Constant_301094" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4447" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3201,x2.77"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4448" name="Constant_325384" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4449" name="__module.model.gpt_neox.layers.19.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3202"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4450" name="Constant_301139" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4451" name="Constant_301144" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4452" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3196"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4453" name="__module.model.gpt_neox.layers.19.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3204"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4454" name="self.model.gpt_neox.layers.19.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.19.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4455" name="__module.model.gpt_neox.layers.19.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4456" name="__module.model.gpt_neox.layers.19.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4457" name="__module.model.gpt_neox.layers.19.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3181,3184,sin.77"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4458" name="Constant_38344" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4459" name="__module.model.gpt_neox.layers.19.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3189"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4460" name="__module.model.gpt_neox.layers.19.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3190,sin.79"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4461" name="__module.model.gpt_neox.layers.19.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3205"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4462" name="__module.model.gpt_neox.layers.19.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3206,3224,3234,query.117,query.119"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4463" name="Constant_11275" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3162"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4464" name="__module.model.gpt_neox.layers.19.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3163,key.115"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4465" name="Constant_301190" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4466" name="Constant_301193" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4467" name="Constant_301196" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4468" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3169,k.39"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4469" name="__module.model.gpt_neox.layers.19.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3207"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4470" name="Constant_301200" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4471" name="Constant_301199" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4472" name="__module.model.gpt_neox.layers.19.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4473" name="__module.model.gpt_neox.layers.19.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4474" name="__module.model.gpt_neox.layers.19.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3208,3213" /> + </output> + </layer> + <layer id="4475" name="__module.model.gpt_neox.layers.19.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4476" name="__module.model.gpt_neox.layers.19.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3210,3211,3215,3216" /> + </output> + </layer> + <layer id="4477" name="Constant_337778" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4478" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4479" name="Constant_301198" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4480" name="ScatterUpdate_301201" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4481" name="Constant_301204" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4482" name="Constant_301207" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4483" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3217,x2.79"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4484" name="Constant_325385" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4485" name="__module.model.gpt_neox.layers.19.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3218"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4486" name="Constant_301252" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4487" name="Constant_301257" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4488" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3212"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4489" name="__module.model.gpt_neox.layers.19.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3220"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4490" name="__module.model.gpt_neox.layers.19.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3221"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4491" name="__module.model.gpt_neox.layers.19.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3222,3226"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4492" name="__module.model.gpt_neox.layers.19.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.19.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4493" name="Constant_433145" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4494" name="Constant_433138" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4495" name="Constant_433140" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4496" name="Constant_433142" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4497" name="Concat_433143" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4498" name="Broadcast_433146" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4499" name="ReadValue_417328" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.19.valuepresent.19.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.19.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4500" name="Constant_402007" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4501" name="Gather_402008" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4502" name="Constant_301302" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4503" name="Constant_301305" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4504" name="Constant_301308" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4505" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3164"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4506" name="Constant_11289" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3165"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4507" name="__module.model.gpt_neox.layers.19.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3166"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4508" name="__module.model.gpt_neox.layers.19.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.19.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4509" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="3243"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4510" name="Constant_301312" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4511" name="Constant_301311" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4512" name="ShapeOf_339648" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4513" name="Constant_339649" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4514" name="Constant_339650" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4515" name="Gather_339651" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="4516" name="Add_339652" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3238" /> + </output> + </layer> + <layer id="4517" name="ShapeOf_339719" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4518" name="Constant_339720" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4519" name="Constant_339721" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4520" name="Gather_339722" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3236" /> + </output> + </layer> + <layer id="4521" name="__module.model.gpt_neox.layers.19.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3240,3241" /> + </output> + </layer> + <layer id="4522" name="Constant_337780" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4523" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4524" name="Constant_301310" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4525" name="ScatterUpdate_301313" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4526" name="Constant_301314" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4527" name="Constant_337782" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4528" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4529" name="ScatterUpdate_301315" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4530" name="Constant_301318" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4531" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3244"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4532" name="Constant_301391" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4533" name="Constant_301392" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4534" name="Constant_301388" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4535" name="Constant_301387" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4536" name="ScatterUpdate_301393" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4537" name="Constant_301396" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4538" name="__module.model.gpt_neox.layers.19.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3245,3246"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4539" name="__module.model.gpt_neox.layers.19.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4540" name="__module.model.gpt_neox.layers.19.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="3233" /> + </output> + </layer> + <layer id="4541" name="__module.model.gpt_neox.layers.19.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="3247,causal_mask.77"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4542" name="Add_316356" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4543" name="ShapeOf_316357" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4544" name="Constant_339725" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4545" name="Constant_339726" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4546" name="Gather_339727" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3231"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4547" name="Constant_268151" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4548" name="Constant_268153" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4549" name="Constant_268155" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4550" name="__module.model.gpt_neox.layers.19.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3248"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4551" name="Maximum_316358" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4552" name="__module.model.gpt_neox.layers.19.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3250"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4553" name="__module.model.gpt_neox.layers.19.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3251,3252,sdpa_result.39,tensor.77"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4554" name="Constant_11730" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3253"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4555" name="__module.model.gpt_neox.layers.19.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3254"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4556" name="__module.model.gpt_neox.layers.19.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4557" name="__module.model.gpt_neox.layers.19.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3259"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4558" name="self.model.gpt_neox.layers.19.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="4094816388" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4559" name="Convert_449702" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4560" name="self.model.gpt_neox.layers.19.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4111593604" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4561" name="Convert_449705" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4562" name="self.model.gpt_neox.layers.19.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4563" name="self.model.gpt_neox.layers.19.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4111597700" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4564" name="self.model.gpt_neox.layers.19.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4565" name="self.model.gpt_neox.layers.19.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4566" name="__module.model.gpt_neox.layers.19.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4567" name="Constant_325386" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4111605892" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4568" name="__module.model.gpt_neox.layers.19.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3262,3264,input.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4569" name="__module.model.gpt_neox.layers.19/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3268,attn_output.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4570" name="__module.model.gpt_neox.layers.19.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4571" name="__module.model.gpt_neox.layers.19.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4572" name="Constant_325387" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4111622276" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4573" name="__module.model.gpt_neox.layers.19.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4574" name="Constant_325388" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4111638660" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4575" name="__module.model.gpt_neox.layers.19.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3272"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4576" name="self.model.gpt_neox.layers.19.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="4111655044" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4577" name="Convert_449713" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4578" name="self.model.gpt_neox.layers.19.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="4178763908" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4579" name="Convert_449716" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4580" name="self.model.gpt_neox.layers.19.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4581" name="self.model.gpt_neox.layers.19.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="4178780292" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4582" name="self.model.gpt_neox.layers.19.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4583" name="self.model.gpt_neox.layers.19.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4584" name="__module.model.gpt_neox.layers.19.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4585" name="Constant_325389" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="4178813060" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4586" name="__module.model.gpt_neox.layers.19.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3277"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4587" name="__module.model.gpt_neox.layers.19.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3278"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4588" name="self.model.gpt_neox.layers.19.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="4178878596" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4589" name="Convert_449724" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4590" name="self.model.gpt_neox.layers.19.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4245987460" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4591" name="Convert_449727" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4592" name="self.model.gpt_neox.layers.19.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4593" name="self.model.gpt_neox.layers.19.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4245991556" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4594" name="self.model.gpt_neox.layers.19.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4595" name="self.model.gpt_neox.layers.19.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4596" name="__module.model.gpt_neox.layers.19.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4597" name="Constant_325390" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4245999748" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4598" name="__module.model.gpt_neox.layers.19.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3281,input.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4599" name="__module.model.gpt_neox.layers.19/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3283,3285,hidden_states.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4600" name="__module.model.gpt_neox.layers.20.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4601" name="__module.model.gpt_neox.layers.20.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4602" name="Constant_325391" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4246016132" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4603" name="__module.model.gpt_neox.layers.20.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4604" name="Constant_325392" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4246032516" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4605" name="__module.model.gpt_neox.layers.20.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3295"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4606" name="self.model.gpt_neox.layers.20.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="4246048900" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4607" name="Convert_449735" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4608" name="self.model.gpt_neox.layers.20.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="4296380548" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4609" name="Convert_449738" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4610" name="self.model.gpt_neox.layers.20.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4611" name="self.model.gpt_neox.layers.20.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="4296392836" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4612" name="self.model.gpt_neox.layers.20.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4613" name="self.model.gpt_neox.layers.20.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4614" name="__module.model.gpt_neox.layers.20.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4615" name="Constant_325393" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="4296417412" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4616" name="__module.model.gpt_neox.layers.20.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3302,qkv.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4617" name="__module.model.gpt_neox.layers.20.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4618" name="__module.model.gpt_neox.layers.20.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3306,qkv.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="4619" name="Constant_301403" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4620" name="Constant_301406" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4621" name="Constant_301409" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4622" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3307"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4623" name="Constant_11842" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3308"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4624" name="__module.model.gpt_neox.layers.20.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3309,query.121"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4625" name="Constant_301415" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4626" name="Constant_301418" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4627" name="Constant_301421" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4628" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3316,q.41"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4629" name="self.model.gpt_neox.layers.20.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.20.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4630" name="__module.model.gpt_neox.layers.20.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4631" name="Constant_301427" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4632" name="Constant_301430" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4633" name="Constant_301433" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4634" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3310"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4635" name="ShapeOf_339729" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4636" name="Constant_341030" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4637" name="Constant_339731" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4638" name="Gather_339732" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3320"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4639" name="Constant_433158" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4640" name="Constant_433151" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4641" name="Constant_433153" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4642" name="Constant_433155" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4643" name="Concat_433156" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4644" name="Broadcast_433159" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4645" name="ReadValue_417334" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.20.keypresent.20.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.20.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4646" name="Constant_402010" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4647" name="Gather_402011" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4648" name="ShapeOf_339734" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4649" name="Constant_339735" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4650" name="Constant_339736" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4651" name="Gather_339737" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3322" /> + </output> + </layer> + <layer id="4652" name="Constant_337784" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4653" name="Reshape_340945" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4654" name="__module.model.gpt_neox.layers.20.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3321,3325,3326,seq_len.81"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4655" name="__module.model.gpt_neox.layers.20.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4656" name="__module.model.gpt_neox.layers.20.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3329,3332,cos.81"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4657" name="Constant_38347" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4658" name="__module.model.gpt_neox.layers.20.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3335"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4659" name="__module.model.gpt_neox.layers.20.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3336,cos.83"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4660" name="__module.model.gpt_neox.layers.20.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3340"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4661" name="Constant_301438" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4662" name="Constant_301437" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4663" name="__module.model.gpt_neox.layers.20.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4664" name="__module.model.gpt_neox.layers.20.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4665" name="__module.model.gpt_neox.layers.20.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3341,3346" /> + </output> + </layer> + <layer id="4666" name="__module.model.gpt_neox.layers.20.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4667" name="__module.model.gpt_neox.layers.20.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3343,3344,3348,3349" /> + </output> + </layer> + <layer id="4668" name="Constant_337786" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4669" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4670" name="Constant_301436" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4671" name="ScatterUpdate_301439" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4672" name="Constant_301442" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4673" name="Constant_301445" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4674" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3350,x2.81"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4675" name="Constant_325394" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4676" name="__module.model.gpt_neox.layers.20.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3351"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4677" name="Constant_301490" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4678" name="Constant_301495" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4679" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3345"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4680" name="__module.model.gpt_neox.layers.20.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3353"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4681" name="self.model.gpt_neox.layers.20.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.20.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4682" name="__module.model.gpt_neox.layers.20.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4683" name="__module.model.gpt_neox.layers.20.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4684" name="__module.model.gpt_neox.layers.20.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3330,3333,sin.81"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4685" name="Constant_38350" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4686" name="__module.model.gpt_neox.layers.20.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3338"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4687" name="__module.model.gpt_neox.layers.20.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3339,sin.83"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4688" name="__module.model.gpt_neox.layers.20.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3354"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4689" name="__module.model.gpt_neox.layers.20.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3355,3373,3383,query.123,query.125"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4690" name="Constant_11856" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3311"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4691" name="__module.model.gpt_neox.layers.20.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3312,key.121"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4692" name="Constant_301541" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4693" name="Constant_301544" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4694" name="Constant_301547" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4695" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3318,k.41"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4696" name="__module.model.gpt_neox.layers.20.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3356"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4697" name="Constant_301551" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4698" name="Constant_301550" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4699" name="__module.model.gpt_neox.layers.20.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4700" name="__module.model.gpt_neox.layers.20.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4701" name="__module.model.gpt_neox.layers.20.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3357,3362" /> + </output> + </layer> + <layer id="4702" name="__module.model.gpt_neox.layers.20.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4703" name="__module.model.gpt_neox.layers.20.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3359,3360,3364,3365" /> + </output> + </layer> + <layer id="4704" name="Constant_337788" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4705" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4706" name="Constant_301549" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4707" name="ScatterUpdate_301552" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4708" name="Constant_301555" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4709" name="Constant_301558" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4710" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3366,x2.83"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4711" name="Constant_325395" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4712" name="__module.model.gpt_neox.layers.20.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3367"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4713" name="Constant_301603" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4714" name="Constant_301608" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4715" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3361"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4716" name="__module.model.gpt_neox.layers.20.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3369"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4717" name="__module.model.gpt_neox.layers.20.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3370"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4718" name="__module.model.gpt_neox.layers.20.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3371,3375"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4719" name="__module.model.gpt_neox.layers.20.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.20.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4720" name="Constant_433171" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4721" name="Constant_433164" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4722" name="Constant_433166" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4723" name="Constant_433168" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4724" name="Concat_433169" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4725" name="Broadcast_433172" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4726" name="ReadValue_417336" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.20.valuepresent.20.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.20.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4727" name="Constant_402013" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4728" name="Gather_402014" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4729" name="Constant_301653" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4730" name="Constant_301656" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4731" name="Constant_301659" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4732" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3313"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4733" name="Constant_11870" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3314"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4734" name="__module.model.gpt_neox.layers.20.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3315"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4735" name="__module.model.gpt_neox.layers.20.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.20.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4736" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="3392"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4737" name="Constant_301663" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4738" name="Constant_301662" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4739" name="ShapeOf_339739" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4740" name="Constant_339740" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4741" name="Constant_339741" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4742" name="Gather_339742" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="4743" name="Add_339743" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3387" /> + </output> + </layer> + <layer id="4744" name="ShapeOf_339810" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4745" name="Constant_339811" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4746" name="Constant_339812" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4747" name="Gather_339813" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3385" /> + </output> + </layer> + <layer id="4748" name="__module.model.gpt_neox.layers.20.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3389,3390" /> + </output> + </layer> + <layer id="4749" name="Constant_337790" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4750" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4751" name="Constant_301661" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4752" name="ScatterUpdate_301664" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4753" name="Constant_301665" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4754" name="Constant_337792" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4755" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4756" name="ScatterUpdate_301666" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4757" name="Constant_301669" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4758" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3393"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4759" name="Constant_301742" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4760" name="Constant_301743" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4761" name="Constant_301739" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4762" name="Constant_301738" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4763" name="ScatterUpdate_301744" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4764" name="Constant_301747" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4765" name="__module.model.gpt_neox.layers.20.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3394,3395"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4766" name="__module.model.gpt_neox.layers.20.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4767" name="__module.model.gpt_neox.layers.20.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="3382" /> + </output> + </layer> + <layer id="4768" name="__module.model.gpt_neox.layers.20.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="3396,causal_mask.81"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4769" name="Add_316428" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4770" name="ShapeOf_316429" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4771" name="Constant_339816" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4772" name="Constant_339817" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4773" name="Gather_339818" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3380"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4774" name="Constant_268161" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4775" name="Constant_268163" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4776" name="Constant_268165" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4777" name="__module.model.gpt_neox.layers.20.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3397"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4778" name="Maximum_316430" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4779" name="__module.model.gpt_neox.layers.20.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3399"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4780" name="__module.model.gpt_neox.layers.20.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3400,3401,sdpa_result.41,tensor.81"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4781" name="Constant_12311" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3402"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4782" name="__module.model.gpt_neox.layers.20.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3403"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4783" name="__module.model.gpt_neox.layers.20.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4784" name="__module.model.gpt_neox.layers.20.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3408"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4785" name="self.model.gpt_neox.layers.20.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="4296466564" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4786" name="Convert_449746" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4787" name="self.model.gpt_neox.layers.20.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4313243780" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4788" name="Convert_449749" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4789" name="self.model.gpt_neox.layers.20.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4790" name="self.model.gpt_neox.layers.20.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4313247876" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4791" name="self.model.gpt_neox.layers.20.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4792" name="self.model.gpt_neox.layers.20.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4793" name="__module.model.gpt_neox.layers.20.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4794" name="Constant_325396" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4313256068" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4795" name="__module.model.gpt_neox.layers.20.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3411,3413,input.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4796" name="__module.model.gpt_neox.layers.20/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3417,attn_output.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4797" name="__module.model.gpt_neox.layers.20.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4798" name="__module.model.gpt_neox.layers.20.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4799" name="Constant_325397" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4313272452" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4800" name="__module.model.gpt_neox.layers.20.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4801" name="Constant_325398" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4313288836" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4802" name="__module.model.gpt_neox.layers.20.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3421"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4803" name="self.model.gpt_neox.layers.20.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="4313305220" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4804" name="Convert_449757" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4805" name="self.model.gpt_neox.layers.20.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="4380414084" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4806" name="Convert_449760" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4807" name="self.model.gpt_neox.layers.20.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4808" name="self.model.gpt_neox.layers.20.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="4380430468" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4809" name="self.model.gpt_neox.layers.20.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4810" name="self.model.gpt_neox.layers.20.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4811" name="__module.model.gpt_neox.layers.20.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4812" name="Constant_325399" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="4380463236" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4813" name="__module.model.gpt_neox.layers.20.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3426"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4814" name="__module.model.gpt_neox.layers.20.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3427"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4815" name="self.model.gpt_neox.layers.20.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="4380528772" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4816" name="Convert_449768" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4817" name="self.model.gpt_neox.layers.20.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4447637636" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4818" name="Convert_449771" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4819" name="self.model.gpt_neox.layers.20.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4820" name="self.model.gpt_neox.layers.20.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4447641732" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4821" name="self.model.gpt_neox.layers.20.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4822" name="self.model.gpt_neox.layers.20.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="4823" name="__module.model.gpt_neox.layers.20.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4824" name="Constant_325400" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4447649924" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4825" name="__module.model.gpt_neox.layers.20.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3430,input.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4826" name="__module.model.gpt_neox.layers.20/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3432,3434,hidden_states.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4827" name="__module.model.gpt_neox.layers.21.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4828" name="__module.model.gpt_neox.layers.21.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4829" name="Constant_325401" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4447666308" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4830" name="__module.model.gpt_neox.layers.21.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4831" name="Constant_325402" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4447682692" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4832" name="__module.model.gpt_neox.layers.21.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3444"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4833" name="self.model.gpt_neox.layers.21.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="4447699076" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4834" name="Convert_449779" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4835" name="self.model.gpt_neox.layers.21.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="4498030724" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4836" name="Convert_449782" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4837" name="self.model.gpt_neox.layers.21.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4838" name="self.model.gpt_neox.layers.21.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="4498043012" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4839" name="self.model.gpt_neox.layers.21.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4840" name="self.model.gpt_neox.layers.21.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="4841" name="__module.model.gpt_neox.layers.21.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4842" name="Constant_325403" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="4498067588" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4843" name="__module.model.gpt_neox.layers.21.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3451,qkv.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="4844" name="__module.model.gpt_neox.layers.21.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4845" name="__module.model.gpt_neox.layers.21.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3455,qkv.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="4846" name="Constant_301754" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4847" name="Constant_301757" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4848" name="Constant_301760" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4849" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3456"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4850" name="Constant_12423" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3457"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4851" name="__module.model.gpt_neox.layers.21.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3458,query.127"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4852" name="Constant_301766" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4853" name="Constant_301769" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4854" name="Constant_301772" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4855" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3465,q.43"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4856" name="self.model.gpt_neox.layers.21.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.21.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4857" name="__module.model.gpt_neox.layers.21.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4858" name="Constant_301778" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4859" name="Constant_301781" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4860" name="Constant_301784" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4861" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3459"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4862" name="ShapeOf_339820" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4863" name="Constant_341033" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4864" name="Constant_339822" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4865" name="Gather_339823" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3469"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4866" name="Constant_433184" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4867" name="Constant_433177" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4868" name="Constant_433179" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4869" name="Constant_433181" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4870" name="Concat_433182" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4871" name="Broadcast_433185" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4872" name="ReadValue_417338" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.21.keypresent.21.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.21.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4873" name="Constant_402016" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4874" name="Gather_402017" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4875" name="ShapeOf_339825" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4876" name="Constant_339826" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4877" name="Constant_339827" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4878" name="Gather_339828" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3471" /> + </output> + </layer> + <layer id="4879" name="Constant_337794" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4880" name="Reshape_340947" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4881" name="__module.model.gpt_neox.layers.21.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3470,3474,3475,seq_len.85"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4882" name="__module.model.gpt_neox.layers.21.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4883" name="__module.model.gpt_neox.layers.21.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3478,3481,cos.85"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4884" name="Constant_38353" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4885" name="__module.model.gpt_neox.layers.21.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3484"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4886" name="__module.model.gpt_neox.layers.21.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3485,cos.87"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4887" name="__module.model.gpt_neox.layers.21.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3489"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4888" name="Constant_301789" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4889" name="Constant_301788" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4890" name="__module.model.gpt_neox.layers.21.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4891" name="__module.model.gpt_neox.layers.21.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4892" name="__module.model.gpt_neox.layers.21.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3490,3495" /> + </output> + </layer> + <layer id="4893" name="__module.model.gpt_neox.layers.21.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4894" name="__module.model.gpt_neox.layers.21.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3492,3493,3497,3498" /> + </output> + </layer> + <layer id="4895" name="Constant_337796" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4896" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4897" name="Constant_301787" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4898" name="ScatterUpdate_301790" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4899" name="Constant_301793" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4900" name="Constant_301796" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4901" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3499,x2.85"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4902" name="Constant_325404" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4903" name="__module.model.gpt_neox.layers.21.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3500"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4904" name="Constant_301841" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4905" name="Constant_301846" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4906" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3494"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4907" name="__module.model.gpt_neox.layers.21.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3502"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4908" name="self.model.gpt_neox.layers.21.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.21.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4909" name="__module.model.gpt_neox.layers.21.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4910" name="__module.model.gpt_neox.layers.21.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4911" name="__module.model.gpt_neox.layers.21.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3479,3482,sin.85"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4912" name="Constant_38356" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4913" name="__module.model.gpt_neox.layers.21.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3487"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4914" name="__module.model.gpt_neox.layers.21.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3488,sin.87"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4915" name="__module.model.gpt_neox.layers.21.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3503"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4916" name="__module.model.gpt_neox.layers.21.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3504,3522,3532,query.129,query.131"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4917" name="Constant_12437" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3460"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4918" name="__module.model.gpt_neox.layers.21.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3461,key.127"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4919" name="Constant_301892" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4920" name="Constant_301895" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4921" name="Constant_301898" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4922" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3467,k.43"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4923" name="__module.model.gpt_neox.layers.21.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3505"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4924" name="Constant_301902" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4925" name="Constant_301901" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4926" name="__module.model.gpt_neox.layers.21.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4927" name="__module.model.gpt_neox.layers.21.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4928" name="__module.model.gpt_neox.layers.21.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3506,3511" /> + </output> + </layer> + <layer id="4929" name="__module.model.gpt_neox.layers.21.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4930" name="__module.model.gpt_neox.layers.21.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3508,3509,3513,3514" /> + </output> + </layer> + <layer id="4931" name="Constant_337798" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4932" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4933" name="Constant_301900" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4934" name="ScatterUpdate_301903" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4935" name="Constant_301906" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4936" name="Constant_301909" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4937" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3515,x2.87"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4938" name="Constant_325405" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4939" name="__module.model.gpt_neox.layers.21.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3516"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4940" name="Constant_301954" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4941" name="Constant_301959" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4942" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3510"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4943" name="__module.model.gpt_neox.layers.21.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3518"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4944" name="__module.model.gpt_neox.layers.21.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3519"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4945" name="__module.model.gpt_neox.layers.21.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3520,3524"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4946" name="__module.model.gpt_neox.layers.21.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.21.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4947" name="Constant_433197" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4948" name="Constant_433190" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4949" name="Constant_433192" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4950" name="Constant_433194" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4951" name="Concat_433195" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4952" name="Broadcast_433198" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4953" name="ReadValue_417340" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.21.valuepresent.21.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.21.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4954" name="Constant_402019" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4955" name="Gather_402020" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4956" name="Constant_302004" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4957" name="Constant_302007" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4958" name="Constant_302010" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4959" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3462"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4960" name="Constant_12451" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3463"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4961" name="__module.model.gpt_neox.layers.21.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3464"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4962" name="__module.model.gpt_neox.layers.21.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.21.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4963" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="3541"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4964" name="Constant_302014" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4965" name="Constant_302013" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4966" name="ShapeOf_339830" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4967" name="Constant_339831" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4968" name="Constant_339832" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4969" name="Gather_339833" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="4970" name="Add_339834" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3536" /> + </output> + </layer> + <layer id="4971" name="ShapeOf_339901" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4972" name="Constant_339902" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4973" name="Constant_339903" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4974" name="Gather_339904" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3534" /> + </output> + </layer> + <layer id="4975" name="__module.model.gpt_neox.layers.21.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3538,3539" /> + </output> + </layer> + <layer id="4976" name="Constant_337800" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4977" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4978" name="Constant_302012" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4979" name="ScatterUpdate_302015" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4980" name="Constant_302016" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4981" name="Constant_337802" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4982" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4983" name="ScatterUpdate_302017" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4984" name="Constant_302020" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4985" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3542"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="4986" name="Constant_302093" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4987" name="Constant_302094" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4988" name="Constant_302090" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4989" name="Constant_302089" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4990" name="ScatterUpdate_302095" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4991" name="Constant_302098" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4992" name="__module.model.gpt_neox.layers.21.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3543,3544"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4993" name="__module.model.gpt_neox.layers.21.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4994" name="__module.model.gpt_neox.layers.21.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="3531" /> + </output> + </layer> + <layer id="4995" name="__module.model.gpt_neox.layers.21.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="3545,causal_mask.85"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4996" name="Add_316500" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4997" name="ShapeOf_316501" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4998" name="Constant_339907" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4999" name="Constant_339908" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5000" name="Gather_339909" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3529"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5001" name="Constant_268171" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5002" name="Constant_268173" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5003" name="Constant_268175" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5004" name="__module.model.gpt_neox.layers.21.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3546"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5005" name="Maximum_316502" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5006" name="__module.model.gpt_neox.layers.21.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3548"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5007" name="__module.model.gpt_neox.layers.21.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3549,3550,sdpa_result.43,tensor.85"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5008" name="Constant_12892" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3551"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5009" name="__module.model.gpt_neox.layers.21.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3552"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5010" name="__module.model.gpt_neox.layers.21.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5011" name="__module.model.gpt_neox.layers.21.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3557"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5012" name="self.model.gpt_neox.layers.21.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="4498116740" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5013" name="Convert_449790" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5014" name="self.model.gpt_neox.layers.21.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4514893956" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5015" name="Convert_449793" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5016" name="self.model.gpt_neox.layers.21.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5017" name="self.model.gpt_neox.layers.21.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4514898052" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5018" name="self.model.gpt_neox.layers.21.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5019" name="self.model.gpt_neox.layers.21.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5020" name="__module.model.gpt_neox.layers.21.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5021" name="Constant_325406" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4514906244" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5022" name="__module.model.gpt_neox.layers.21.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3560,3562,input.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5023" name="__module.model.gpt_neox.layers.21/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3566,attn_output.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5024" name="__module.model.gpt_neox.layers.21.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5025" name="__module.model.gpt_neox.layers.21.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5026" name="Constant_325407" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4514922628" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5027" name="__module.model.gpt_neox.layers.21.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5028" name="Constant_325408" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4514939012" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5029" name="__module.model.gpt_neox.layers.21.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3570"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5030" name="self.model.gpt_neox.layers.21.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="4514955396" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5031" name="Convert_449801" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5032" name="self.model.gpt_neox.layers.21.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="4582064260" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5033" name="Convert_449804" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5034" name="self.model.gpt_neox.layers.21.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5035" name="self.model.gpt_neox.layers.21.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="4582080644" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5036" name="self.model.gpt_neox.layers.21.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5037" name="self.model.gpt_neox.layers.21.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5038" name="__module.model.gpt_neox.layers.21.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5039" name="Constant_325409" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="4582113412" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5040" name="__module.model.gpt_neox.layers.21.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3575"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5041" name="__module.model.gpt_neox.layers.21.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3576"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5042" name="self.model.gpt_neox.layers.21.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="4582178948" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5043" name="Convert_449812" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5044" name="self.model.gpt_neox.layers.21.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4649287812" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5045" name="Convert_449815" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5046" name="self.model.gpt_neox.layers.21.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5047" name="self.model.gpt_neox.layers.21.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4649291908" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5048" name="self.model.gpt_neox.layers.21.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5049" name="self.model.gpt_neox.layers.21.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5050" name="__module.model.gpt_neox.layers.21.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5051" name="Constant_325410" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4649300100" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5052" name="__module.model.gpt_neox.layers.21.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3579,input.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5053" name="__module.model.gpt_neox.layers.21/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3581,3583,hidden_states.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5054" name="__module.model.gpt_neox.layers.22.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5055" name="__module.model.gpt_neox.layers.22.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5056" name="Constant_325411" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4649316484" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5057" name="__module.model.gpt_neox.layers.22.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5058" name="Constant_325412" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4649332868" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5059" name="__module.model.gpt_neox.layers.22.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3593"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5060" name="self.model.gpt_neox.layers.22.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="4649349252" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5061" name="Convert_449823" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5062" name="self.model.gpt_neox.layers.22.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="4699680900" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5063" name="Convert_449826" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5064" name="self.model.gpt_neox.layers.22.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5065" name="self.model.gpt_neox.layers.22.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="4699693188" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5066" name="self.model.gpt_neox.layers.22.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5067" name="self.model.gpt_neox.layers.22.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5068" name="__module.model.gpt_neox.layers.22.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5069" name="Constant_325413" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="4699717764" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5070" name="__module.model.gpt_neox.layers.22.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3600,qkv.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5071" name="__module.model.gpt_neox.layers.22.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5072" name="__module.model.gpt_neox.layers.22.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3604,qkv.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="5073" name="Constant_302105" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5074" name="Constant_302108" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5075" name="Constant_302111" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5076" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3605"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5077" name="Constant_13004" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3606"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5078" name="__module.model.gpt_neox.layers.22.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3607,query.133"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5079" name="Constant_302117" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5080" name="Constant_302120" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5081" name="Constant_302123" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5082" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3614,q.45"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5083" name="self.model.gpt_neox.layers.22.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.22.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5084" name="__module.model.gpt_neox.layers.22.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5085" name="Constant_302129" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5086" name="Constant_302132" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5087" name="Constant_302135" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5088" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3608"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5089" name="ShapeOf_339911" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5090" name="Constant_341036" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5091" name="Constant_339913" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5092" name="Gather_339914" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3618"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5093" name="Constant_433210" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5094" name="Constant_433203" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5095" name="Constant_433205" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5096" name="Constant_433207" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5097" name="Concat_433208" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5098" name="Broadcast_433211" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5099" name="ReadValue_417342" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.22.keypresent.22.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.22.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5100" name="Constant_402022" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5101" name="Gather_402023" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5102" name="ShapeOf_339916" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5103" name="Constant_339917" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5104" name="Constant_339918" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5105" name="Gather_339919" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3620" /> + </output> + </layer> + <layer id="5106" name="Constant_337804" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5107" name="Reshape_340949" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5108" name="__module.model.gpt_neox.layers.22.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3619,3623,3624,seq_len.89"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5109" name="__module.model.gpt_neox.layers.22.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5110" name="__module.model.gpt_neox.layers.22.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3627,3630,cos.89"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5111" name="Constant_38359" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5112" name="__module.model.gpt_neox.layers.22.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3633"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5113" name="__module.model.gpt_neox.layers.22.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3634,cos.91"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5114" name="__module.model.gpt_neox.layers.22.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3638"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5115" name="Constant_302140" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5116" name="Constant_302139" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5117" name="__module.model.gpt_neox.layers.22.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5118" name="__module.model.gpt_neox.layers.22.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5119" name="__module.model.gpt_neox.layers.22.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3639,3644" /> + </output> + </layer> + <layer id="5120" name="__module.model.gpt_neox.layers.22.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5121" name="__module.model.gpt_neox.layers.22.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3641,3642,3646,3647" /> + </output> + </layer> + <layer id="5122" name="Constant_337806" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5123" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5124" name="Constant_302138" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5125" name="ScatterUpdate_302141" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5126" name="Constant_302144" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5127" name="Constant_302147" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5128" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3648,x2.89"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5129" name="Constant_325414" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5130" name="__module.model.gpt_neox.layers.22.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3649"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5131" name="Constant_302192" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5132" name="Constant_302197" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5133" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3643"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5134" name="__module.model.gpt_neox.layers.22.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3651"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5135" name="self.model.gpt_neox.layers.22.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.22.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5136" name="__module.model.gpt_neox.layers.22.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5137" name="__module.model.gpt_neox.layers.22.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5138" name="__module.model.gpt_neox.layers.22.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3628,3631,sin.89"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5139" name="Constant_38362" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5140" name="__module.model.gpt_neox.layers.22.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3636"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5141" name="__module.model.gpt_neox.layers.22.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3637,sin.91"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5142" name="__module.model.gpt_neox.layers.22.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3652"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5143" name="__module.model.gpt_neox.layers.22.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3653,3671,3681,query.135,query.137"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5144" name="Constant_13018" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3609"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5145" name="__module.model.gpt_neox.layers.22.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3610,key.133"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5146" name="Constant_302243" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5147" name="Constant_302246" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5148" name="Constant_302249" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5149" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3616,k.45"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5150" name="__module.model.gpt_neox.layers.22.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3654"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5151" name="Constant_302253" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5152" name="Constant_302252" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5153" name="__module.model.gpt_neox.layers.22.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5154" name="__module.model.gpt_neox.layers.22.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5155" name="__module.model.gpt_neox.layers.22.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3655,3660" /> + </output> + </layer> + <layer id="5156" name="__module.model.gpt_neox.layers.22.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5157" name="__module.model.gpt_neox.layers.22.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3657,3658,3662,3663" /> + </output> + </layer> + <layer id="5158" name="Constant_337808" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5159" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5160" name="Constant_302251" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5161" name="ScatterUpdate_302254" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5162" name="Constant_302257" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5163" name="Constant_302260" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5164" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3664,x2.91"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5165" name="Constant_325415" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5166" name="__module.model.gpt_neox.layers.22.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3665"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5167" name="Constant_302305" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5168" name="Constant_302310" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5169" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3659"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5170" name="__module.model.gpt_neox.layers.22.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3667"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5171" name="__module.model.gpt_neox.layers.22.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3668"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5172" name="__module.model.gpt_neox.layers.22.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3669,3673"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5173" name="__module.model.gpt_neox.layers.22.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.22.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5174" name="Constant_433223" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5175" name="Constant_433216" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5176" name="Constant_433218" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5177" name="Constant_433220" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5178" name="Concat_433221" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5179" name="Broadcast_433224" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5180" name="ReadValue_417344" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.22.valuepresent.22.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.22.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5181" name="Constant_402025" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5182" name="Gather_402026" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5183" name="Constant_302355" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5184" name="Constant_302358" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5185" name="Constant_302361" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5186" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3611"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5187" name="Constant_13032" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3612"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5188" name="__module.model.gpt_neox.layers.22.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3613"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5189" name="__module.model.gpt_neox.layers.22.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.22.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5190" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="3690"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5191" name="Constant_302365" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5192" name="Constant_302364" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5193" name="ShapeOf_339921" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5194" name="Constant_339922" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5195" name="Constant_339923" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5196" name="Gather_339924" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="5197" name="Add_339925" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3685" /> + </output> + </layer> + <layer id="5198" name="ShapeOf_339992" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5199" name="Constant_339993" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5200" name="Constant_339994" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5201" name="Gather_339995" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3683" /> + </output> + </layer> + <layer id="5202" name="__module.model.gpt_neox.layers.22.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3687,3688" /> + </output> + </layer> + <layer id="5203" name="Constant_337810" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5204" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5205" name="Constant_302363" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5206" name="ScatterUpdate_302366" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5207" name="Constant_302367" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5208" name="Constant_337812" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5209" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5210" name="ScatterUpdate_302368" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5211" name="Constant_302371" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5212" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3691"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5213" name="Constant_302444" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5214" name="Constant_302445" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5215" name="Constant_302441" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5216" name="Constant_302440" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5217" name="ScatterUpdate_302446" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5218" name="Constant_302449" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5219" name="__module.model.gpt_neox.layers.22.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3692,3693"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5220" name="__module.model.gpt_neox.layers.22.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5221" name="__module.model.gpt_neox.layers.22.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="3680" /> + </output> + </layer> + <layer id="5222" name="__module.model.gpt_neox.layers.22.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="3694,causal_mask.89"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5223" name="Add_316572" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5224" name="ShapeOf_316573" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5225" name="Constant_339998" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5226" name="Constant_339999" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5227" name="Gather_340000" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3678"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5228" name="Constant_268181" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5229" name="Constant_268183" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5230" name="Constant_268185" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5231" name="__module.model.gpt_neox.layers.22.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3695"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5232" name="Maximum_316574" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5233" name="__module.model.gpt_neox.layers.22.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3697"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5234" name="__module.model.gpt_neox.layers.22.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3698,3699,sdpa_result.45,tensor.89"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5235" name="Constant_13473" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3700"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5236" name="__module.model.gpt_neox.layers.22.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3701"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5237" name="__module.model.gpt_neox.layers.22.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5238" name="__module.model.gpt_neox.layers.22.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3706"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5239" name="self.model.gpt_neox.layers.22.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="4699766916" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5240" name="Convert_449834" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5241" name="self.model.gpt_neox.layers.22.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4716544132" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5242" name="Convert_449837" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5243" name="self.model.gpt_neox.layers.22.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5244" name="self.model.gpt_neox.layers.22.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4716548228" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5245" name="self.model.gpt_neox.layers.22.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5246" name="self.model.gpt_neox.layers.22.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5247" name="__module.model.gpt_neox.layers.22.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5248" name="Constant_325416" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4716556420" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5249" name="__module.model.gpt_neox.layers.22.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3709,3711,input.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5250" name="__module.model.gpt_neox.layers.22/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3715,attn_output.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5251" name="__module.model.gpt_neox.layers.22.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5252" name="__module.model.gpt_neox.layers.22.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5253" name="Constant_325417" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4716572804" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5254" name="__module.model.gpt_neox.layers.22.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5255" name="Constant_325418" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4716589188" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5256" name="__module.model.gpt_neox.layers.22.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3719"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5257" name="self.model.gpt_neox.layers.22.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="4716605572" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5258" name="Convert_449845" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5259" name="self.model.gpt_neox.layers.22.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="4783714436" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5260" name="Convert_449848" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5261" name="self.model.gpt_neox.layers.22.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5262" name="self.model.gpt_neox.layers.22.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="4783730820" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5263" name="self.model.gpt_neox.layers.22.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5264" name="self.model.gpt_neox.layers.22.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5265" name="__module.model.gpt_neox.layers.22.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5266" name="Constant_325419" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="4783763588" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5267" name="__module.model.gpt_neox.layers.22.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3724"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5268" name="__module.model.gpt_neox.layers.22.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3725"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5269" name="self.model.gpt_neox.layers.22.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="4783829124" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5270" name="Convert_449856" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5271" name="self.model.gpt_neox.layers.22.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4850937988" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5272" name="Convert_449859" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5273" name="self.model.gpt_neox.layers.22.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5274" name="self.model.gpt_neox.layers.22.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4850942084" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5275" name="self.model.gpt_neox.layers.22.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5276" name="self.model.gpt_neox.layers.22.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5277" name="__module.model.gpt_neox.layers.22.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5278" name="Constant_325420" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4850950276" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5279" name="__module.model.gpt_neox.layers.22.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3728,input.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5280" name="__module.model.gpt_neox.layers.22/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3730,3732,hidden_states.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5281" name="__module.model.gpt_neox.layers.23.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5282" name="__module.model.gpt_neox.layers.23.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5283" name="Constant_325421" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4850966660" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5284" name="__module.model.gpt_neox.layers.23.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5285" name="Constant_325422" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4850983044" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5286" name="__module.model.gpt_neox.layers.23.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3742"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5287" name="self.model.gpt_neox.layers.23.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="4850999428" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5288" name="Convert_449867" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5289" name="self.model.gpt_neox.layers.23.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="4901331076" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5290" name="Convert_449870" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5291" name="self.model.gpt_neox.layers.23.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5292" name="self.model.gpt_neox.layers.23.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="4901343364" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5293" name="self.model.gpt_neox.layers.23.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5294" name="self.model.gpt_neox.layers.23.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5295" name="__module.model.gpt_neox.layers.23.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5296" name="Constant_325423" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="4901367940" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5297" name="__module.model.gpt_neox.layers.23.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3749,qkv.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5298" name="__module.model.gpt_neox.layers.23.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5299" name="__module.model.gpt_neox.layers.23.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3753,qkv.95"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="5300" name="Constant_302456" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5301" name="Constant_302459" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5302" name="Constant_302462" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5303" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3754"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5304" name="Constant_13585" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3755"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5305" name="__module.model.gpt_neox.layers.23.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3756,query.139"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5306" name="Constant_302468" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5307" name="Constant_302471" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5308" name="Constant_302474" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5309" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3763,q.47"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5310" name="self.model.gpt_neox.layers.23.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.23.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5311" name="__module.model.gpt_neox.layers.23.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5312" name="Constant_302480" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5313" name="Constant_302483" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5314" name="Constant_302486" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5315" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3757"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5316" name="ShapeOf_340002" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5317" name="Constant_341039" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5318" name="Constant_340004" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5319" name="Gather_340005" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3767"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5320" name="Constant_433236" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5321" name="Constant_433229" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5322" name="Constant_433231" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5323" name="Constant_433233" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5324" name="Concat_433234" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5325" name="Broadcast_433237" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5326" name="ReadValue_417346" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.23.keypresent.23.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.23.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5327" name="Constant_402028" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5328" name="Gather_402029" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5329" name="ShapeOf_340007" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5330" name="Constant_340008" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5331" name="Constant_340009" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5332" name="Gather_340010" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3769" /> + </output> + </layer> + <layer id="5333" name="Constant_337814" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5334" name="Reshape_340951" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5335" name="__module.model.gpt_neox.layers.23.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3768,3772,3773,seq_len.93"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5336" name="__module.model.gpt_neox.layers.23.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5337" name="__module.model.gpt_neox.layers.23.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3776,3779,cos.93"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5338" name="Constant_38365" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5339" name="__module.model.gpt_neox.layers.23.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3782"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5340" name="__module.model.gpt_neox.layers.23.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3783,cos.95"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5341" name="__module.model.gpt_neox.layers.23.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3787"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5342" name="Constant_302491" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5343" name="Constant_302490" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5344" name="__module.model.gpt_neox.layers.23.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5345" name="__module.model.gpt_neox.layers.23.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5346" name="__module.model.gpt_neox.layers.23.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3788,3793" /> + </output> + </layer> + <layer id="5347" name="__module.model.gpt_neox.layers.23.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5348" name="__module.model.gpt_neox.layers.23.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3790,3791,3795,3796" /> + </output> + </layer> + <layer id="5349" name="Constant_337816" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5350" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5351" name="Constant_302489" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5352" name="ScatterUpdate_302492" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5353" name="Constant_302495" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5354" name="Constant_302498" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5355" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3797,x2.93"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5356" name="Constant_325424" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5357" name="__module.model.gpt_neox.layers.23.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3798"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5358" name="Constant_302543" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5359" name="Constant_302548" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5360" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3792"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5361" name="__module.model.gpt_neox.layers.23.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3800"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5362" name="self.model.gpt_neox.layers.23.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.23.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5363" name="__module.model.gpt_neox.layers.23.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5364" name="__module.model.gpt_neox.layers.23.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5365" name="__module.model.gpt_neox.layers.23.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3777,3780,sin.93"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5366" name="Constant_38368" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5367" name="__module.model.gpt_neox.layers.23.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3785"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5368" name="__module.model.gpt_neox.layers.23.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3786,sin.95"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5369" name="__module.model.gpt_neox.layers.23.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3801"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5370" name="__module.model.gpt_neox.layers.23.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3802,3820,3830,query.141,query.143"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5371" name="Constant_13599" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3758"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5372" name="__module.model.gpt_neox.layers.23.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3759,key.139"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5373" name="Constant_302594" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5374" name="Constant_302597" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5375" name="Constant_302600" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5376" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3765,k.47"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5377" name="__module.model.gpt_neox.layers.23.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3803"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5378" name="Constant_302604" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5379" name="Constant_302603" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5380" name="__module.model.gpt_neox.layers.23.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5381" name="__module.model.gpt_neox.layers.23.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5382" name="__module.model.gpt_neox.layers.23.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3804,3809" /> + </output> + </layer> + <layer id="5383" name="__module.model.gpt_neox.layers.23.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5384" name="__module.model.gpt_neox.layers.23.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3806,3807,3811,3812" /> + </output> + </layer> + <layer id="5385" name="Constant_337818" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5386" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5387" name="Constant_302602" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5388" name="ScatterUpdate_302605" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5389" name="Constant_302608" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5390" name="Constant_302611" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5391" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3813,x2.95"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5392" name="Constant_325425" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5393" name="__module.model.gpt_neox.layers.23.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3814"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5394" name="Constant_302656" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5395" name="Constant_302661" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5396" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3808"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5397" name="__module.model.gpt_neox.layers.23.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3816"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5398" name="__module.model.gpt_neox.layers.23.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3817"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5399" name="__module.model.gpt_neox.layers.23.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3818,3822"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5400" name="__module.model.gpt_neox.layers.23.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.23.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5401" name="Constant_433249" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5402" name="Constant_433242" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5403" name="Constant_433244" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5404" name="Constant_433246" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5405" name="Concat_433247" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5406" name="Broadcast_433250" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5407" name="ReadValue_417348" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.23.valuepresent.23.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.23.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5408" name="Constant_402031" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5409" name="Gather_402032" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5410" name="Constant_302706" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5411" name="Constant_302709" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5412" name="Constant_302712" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5413" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3760"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5414" name="Constant_13613" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3761"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5415" name="__module.model.gpt_neox.layers.23.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3762"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5416" name="__module.model.gpt_neox.layers.23.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.23.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5417" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="3839"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5418" name="Constant_302716" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5419" name="Constant_302715" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5420" name="ShapeOf_340012" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5421" name="Constant_340013" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5422" name="Constant_340014" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5423" name="Gather_340015" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="5424" name="Add_340016" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3834" /> + </output> + </layer> + <layer id="5425" name="ShapeOf_340083" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5426" name="Constant_340084" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5427" name="Constant_340085" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5428" name="Gather_340086" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3832" /> + </output> + </layer> + <layer id="5429" name="__module.model.gpt_neox.layers.23.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3836,3837" /> + </output> + </layer> + <layer id="5430" name="Constant_337820" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5431" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5432" name="Constant_302714" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5433" name="ScatterUpdate_302717" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5434" name="Constant_302718" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5435" name="Constant_337822" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5436" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5437" name="ScatterUpdate_302719" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5438" name="Constant_302722" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5439" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3840"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5440" name="Constant_302795" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5441" name="Constant_302796" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5442" name="Constant_302792" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5443" name="Constant_302791" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5444" name="ScatterUpdate_302797" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5445" name="Constant_302800" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5446" name="__module.model.gpt_neox.layers.23.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3841,3842"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5447" name="__module.model.gpt_neox.layers.23.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5448" name="__module.model.gpt_neox.layers.23.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="3829" /> + </output> + </layer> + <layer id="5449" name="__module.model.gpt_neox.layers.23.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="3843,causal_mask.93"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5450" name="Add_316644" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5451" name="ShapeOf_316645" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5452" name="Constant_340089" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5453" name="Constant_340090" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5454" name="Gather_340091" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3827"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5455" name="Constant_268191" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5456" name="Constant_268193" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5457" name="Constant_268195" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5458" name="__module.model.gpt_neox.layers.23.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3844"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5459" name="Maximum_316646" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5460" name="__module.model.gpt_neox.layers.23.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3846"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5461" name="__module.model.gpt_neox.layers.23.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3847,3848,sdpa_result.47,tensor.93"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5462" name="Constant_14054" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3849"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5463" name="__module.model.gpt_neox.layers.23.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3850"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5464" name="__module.model.gpt_neox.layers.23.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5465" name="__module.model.gpt_neox.layers.23.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3855"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5466" name="self.model.gpt_neox.layers.23.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="4901417092" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5467" name="Convert_449878" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5468" name="self.model.gpt_neox.layers.23.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="4918194308" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5469" name="Convert_449881" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5470" name="self.model.gpt_neox.layers.23.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5471" name="self.model.gpt_neox.layers.23.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="4918198404" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5472" name="self.model.gpt_neox.layers.23.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5473" name="self.model.gpt_neox.layers.23.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5474" name="__module.model.gpt_neox.layers.23.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5475" name="Constant_325426" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4918206596" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5476" name="__module.model.gpt_neox.layers.23.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3858,3860,input.95"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5477" name="__module.model.gpt_neox.layers.23/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3864,attn_output.95"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5478" name="__module.model.gpt_neox.layers.23.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5479" name="__module.model.gpt_neox.layers.23.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5480" name="Constant_325427" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4918222980" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5481" name="__module.model.gpt_neox.layers.23.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5482" name="Constant_325428" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="4918239364" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5483" name="__module.model.gpt_neox.layers.23.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3868"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5484" name="self.model.gpt_neox.layers.23.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="4918255748" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5485" name="Convert_449889" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5486" name="self.model.gpt_neox.layers.23.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="4985364612" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5487" name="Convert_449892" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5488" name="self.model.gpt_neox.layers.23.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5489" name="self.model.gpt_neox.layers.23.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="4985380996" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5490" name="self.model.gpt_neox.layers.23.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5491" name="self.model.gpt_neox.layers.23.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5492" name="__module.model.gpt_neox.layers.23.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5493" name="Constant_325429" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="4985413764" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5494" name="__module.model.gpt_neox.layers.23.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3873"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5495" name="__module.model.gpt_neox.layers.23.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3874"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5496" name="self.model.gpt_neox.layers.23.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="4985479300" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5497" name="Convert_449900" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5498" name="self.model.gpt_neox.layers.23.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5052588164" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5499" name="Convert_449903" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5500" name="self.model.gpt_neox.layers.23.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5501" name="self.model.gpt_neox.layers.23.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5052592260" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5502" name="self.model.gpt_neox.layers.23.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5503" name="self.model.gpt_neox.layers.23.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5504" name="__module.model.gpt_neox.layers.23.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5505" name="Constant_325430" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5052600452" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5506" name="__module.model.gpt_neox.layers.23.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3877,input.97"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5507" name="__module.model.gpt_neox.layers.23/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3879,3881,hidden_states.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5508" name="__module.model.gpt_neox.layers.24.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5509" name="__module.model.gpt_neox.layers.24.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5510" name="Constant_325431" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5052616836" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5511" name="__module.model.gpt_neox.layers.24.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5512" name="Constant_325432" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5052633220" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5513" name="__module.model.gpt_neox.layers.24.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3891"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5514" name="self.model.gpt_neox.layers.24.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="5052649604" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5515" name="Convert_449911" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5516" name="self.model.gpt_neox.layers.24.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="5102981252" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5517" name="Convert_449914" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5518" name="self.model.gpt_neox.layers.24.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5519" name="self.model.gpt_neox.layers.24.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="5102993540" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5520" name="self.model.gpt_neox.layers.24.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5521" name="self.model.gpt_neox.layers.24.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5522" name="__module.model.gpt_neox.layers.24.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5523" name="Constant_325433" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="5103018116" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5524" name="__module.model.gpt_neox.layers.24.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3898,qkv.97"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5525" name="__module.model.gpt_neox.layers.24.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5526" name="__module.model.gpt_neox.layers.24.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3902,qkv.99"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="5527" name="Constant_302807" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5528" name="Constant_302810" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5529" name="Constant_302813" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5530" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3903"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5531" name="Constant_14166" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3904"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5532" name="__module.model.gpt_neox.layers.24.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3905,query.145"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5533" name="Constant_302819" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5534" name="Constant_302822" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5535" name="Constant_302825" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5536" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3912,q.49"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5537" name="self.model.gpt_neox.layers.24.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.24.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5538" name="__module.model.gpt_neox.layers.24.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5539" name="Constant_302831" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5540" name="Constant_302834" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5541" name="Constant_302837" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5542" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3906"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5543" name="ShapeOf_340093" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5544" name="Constant_341042" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5545" name="Constant_340095" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5546" name="Gather_340096" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3916"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5547" name="Constant_433262" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5548" name="Constant_433255" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5549" name="Constant_433257" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5550" name="Constant_433259" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5551" name="Concat_433260" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5552" name="Broadcast_433263" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5553" name="ReadValue_417350" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.24.keypresent.24.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.24.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5554" name="Constant_402034" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5555" name="Gather_402035" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5556" name="ShapeOf_340098" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5557" name="Constant_340099" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5558" name="Constant_340100" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5559" name="Gather_340101" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3918" /> + </output> + </layer> + <layer id="5560" name="Constant_337824" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5561" name="Reshape_340953" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5562" name="__module.model.gpt_neox.layers.24.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3917,3921,3922,seq_len.97"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5563" name="__module.model.gpt_neox.layers.24.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5564" name="__module.model.gpt_neox.layers.24.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3925,3928,cos.97"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5565" name="Constant_38371" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5566" name="__module.model.gpt_neox.layers.24.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3931"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5567" name="__module.model.gpt_neox.layers.24.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3932,cos.99"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5568" name="__module.model.gpt_neox.layers.24.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3936"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5569" name="Constant_302842" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5570" name="Constant_302841" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5571" name="__module.model.gpt_neox.layers.24.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5572" name="__module.model.gpt_neox.layers.24.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5573" name="__module.model.gpt_neox.layers.24.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3937,3942" /> + </output> + </layer> + <layer id="5574" name="__module.model.gpt_neox.layers.24.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5575" name="__module.model.gpt_neox.layers.24.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3939,3940,3944,3945" /> + </output> + </layer> + <layer id="5576" name="Constant_337826" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5577" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5578" name="Constant_302840" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5579" name="ScatterUpdate_302843" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5580" name="Constant_302846" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5581" name="Constant_302849" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5582" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3946,x2.97"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5583" name="Constant_325434" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5584" name="__module.model.gpt_neox.layers.24.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3947"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5585" name="Constant_302894" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5586" name="Constant_302899" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5587" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3941"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5588" name="__module.model.gpt_neox.layers.24.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3949"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5589" name="self.model.gpt_neox.layers.24.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.24.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5590" name="__module.model.gpt_neox.layers.24.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5591" name="__module.model.gpt_neox.layers.24.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5592" name="__module.model.gpt_neox.layers.24.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3926,3929,sin.97"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5593" name="Constant_38374" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5594" name="__module.model.gpt_neox.layers.24.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="3934"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5595" name="__module.model.gpt_neox.layers.24.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3935,sin.99"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5596" name="__module.model.gpt_neox.layers.24.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3950"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5597" name="__module.model.gpt_neox.layers.24.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3951,3969,3979,query.147,query.149"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5598" name="Constant_14180" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3907"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5599" name="__module.model.gpt_neox.layers.24.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3908,key.145"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5600" name="Constant_302945" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5601" name="Constant_302948" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5602" name="Constant_302951" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5603" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3914,k.49"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5604" name="__module.model.gpt_neox.layers.24.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3952"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5605" name="Constant_302955" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5606" name="Constant_302954" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5607" name="__module.model.gpt_neox.layers.24.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5608" name="__module.model.gpt_neox.layers.24.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5609" name="__module.model.gpt_neox.layers.24.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3953,3958" /> + </output> + </layer> + <layer id="5610" name="__module.model.gpt_neox.layers.24.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5611" name="__module.model.gpt_neox.layers.24.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3955,3956,3960,3961" /> + </output> + </layer> + <layer id="5612" name="Constant_337828" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5613" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5614" name="Constant_302953" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5615" name="ScatterUpdate_302956" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5616" name="Constant_302959" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5617" name="Constant_302962" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5618" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3962,x2.99"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5619" name="Constant_325435" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5620" name="__module.model.gpt_neox.layers.24.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3963"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5621" name="Constant_303007" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5622" name="Constant_303012" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5623" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3957"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5624" name="__module.model.gpt_neox.layers.24.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3965"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5625" name="__module.model.gpt_neox.layers.24.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3966"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5626" name="__module.model.gpt_neox.layers.24.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3967,3971"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5627" name="__module.model.gpt_neox.layers.24.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.24.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5628" name="Constant_433275" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5629" name="Constant_433268" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5630" name="Constant_433270" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5631" name="Constant_433272" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5632" name="Concat_433273" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5633" name="Broadcast_433276" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5634" name="ReadValue_417352" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.24.valuepresent.24.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.24.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5635" name="Constant_402037" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5636" name="Gather_402038" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5637" name="Constant_303057" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5638" name="Constant_303060" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5639" name="Constant_303063" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5640" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3909"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5641" name="Constant_14194" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3910"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5642" name="__module.model.gpt_neox.layers.24.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3911"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5643" name="__module.model.gpt_neox.layers.24.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.24.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5644" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="3988"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5645" name="Constant_303067" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5646" name="Constant_303066" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5647" name="ShapeOf_340103" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5648" name="Constant_340104" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5649" name="Constant_340105" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5650" name="Gather_340106" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="5651" name="Add_340107" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3983" /> + </output> + </layer> + <layer id="5652" name="ShapeOf_340174" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5653" name="Constant_340175" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5654" name="Constant_340176" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5655" name="Gather_340177" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3981" /> + </output> + </layer> + <layer id="5656" name="__module.model.gpt_neox.layers.24.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="3985,3986" /> + </output> + </layer> + <layer id="5657" name="Constant_337830" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5658" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5659" name="Constant_303065" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5660" name="ScatterUpdate_303068" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5661" name="Constant_303069" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5662" name="Constant_337832" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5663" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5664" name="ScatterUpdate_303070" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5665" name="Constant_303073" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5666" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3989"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5667" name="Constant_303146" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5668" name="Constant_303147" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5669" name="Constant_303143" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5670" name="Constant_303142" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5671" name="ScatterUpdate_303148" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5672" name="Constant_303151" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5673" name="__module.model.gpt_neox.layers.24.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="3990,3991"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5674" name="__module.model.gpt_neox.layers.24.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5675" name="__module.model.gpt_neox.layers.24.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="3978" /> + </output> + </layer> + <layer id="5676" name="__module.model.gpt_neox.layers.24.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="3992,causal_mask.97"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5677" name="Add_316716" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5678" name="ShapeOf_316717" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5679" name="Constant_340180" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5680" name="Constant_340181" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5681" name="Gather_340182" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="3976"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5682" name="Constant_268201" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5683" name="Constant_268203" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5684" name="Constant_268205" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5685" name="__module.model.gpt_neox.layers.24.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3993"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5686" name="Maximum_316718" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5687" name="__module.model.gpt_neox.layers.24.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3995"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5688" name="__module.model.gpt_neox.layers.24.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3996,3997,sdpa_result.49,tensor.97"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5689" name="Constant_14635" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="3998"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5690" name="__module.model.gpt_neox.layers.24.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3999"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5691" name="__module.model.gpt_neox.layers.24.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5692" name="__module.model.gpt_neox.layers.24.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4004"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5693" name="self.model.gpt_neox.layers.24.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="5103067268" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5694" name="Convert_449922" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5695" name="self.model.gpt_neox.layers.24.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5119844484" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5696" name="Convert_449925" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5697" name="self.model.gpt_neox.layers.24.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5698" name="self.model.gpt_neox.layers.24.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5119848580" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5699" name="self.model.gpt_neox.layers.24.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5700" name="self.model.gpt_neox.layers.24.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5701" name="__module.model.gpt_neox.layers.24.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5702" name="Constant_325436" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5119856772" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5703" name="__module.model.gpt_neox.layers.24.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4007,4009,input.99"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5704" name="__module.model.gpt_neox.layers.24/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4013,attn_output.99"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5705" name="__module.model.gpt_neox.layers.24.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5706" name="__module.model.gpt_neox.layers.24.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5707" name="Constant_325437" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5119873156" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5708" name="__module.model.gpt_neox.layers.24.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5709" name="Constant_325438" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5119889540" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5710" name="__module.model.gpt_neox.layers.24.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4017"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5711" name="self.model.gpt_neox.layers.24.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="5119905924" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5712" name="Convert_449933" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5713" name="self.model.gpt_neox.layers.24.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="5187014788" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5714" name="Convert_449936" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5715" name="self.model.gpt_neox.layers.24.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5716" name="self.model.gpt_neox.layers.24.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="5187031172" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5717" name="self.model.gpt_neox.layers.24.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5718" name="self.model.gpt_neox.layers.24.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5719" name="__module.model.gpt_neox.layers.24.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5720" name="Constant_325439" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="5187063940" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5721" name="__module.model.gpt_neox.layers.24.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4022"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5722" name="__module.model.gpt_neox.layers.24.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4023"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5723" name="self.model.gpt_neox.layers.24.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="5187129476" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5724" name="Convert_449944" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5725" name="self.model.gpt_neox.layers.24.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5254238340" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5726" name="Convert_449947" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5727" name="self.model.gpt_neox.layers.24.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5728" name="self.model.gpt_neox.layers.24.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5254242436" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5729" name="self.model.gpt_neox.layers.24.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5730" name="self.model.gpt_neox.layers.24.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5731" name="__module.model.gpt_neox.layers.24.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5732" name="Constant_325440" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5254250628" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5733" name="__module.model.gpt_neox.layers.24.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4026,input.101"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5734" name="__module.model.gpt_neox.layers.24/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4028,4030,hidden_states.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5735" name="__module.model.gpt_neox.layers.25.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5736" name="__module.model.gpt_neox.layers.25.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5737" name="Constant_325441" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5254267012" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5738" name="__module.model.gpt_neox.layers.25.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5739" name="Constant_325442" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5254283396" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5740" name="__module.model.gpt_neox.layers.25.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4040"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5741" name="self.model.gpt_neox.layers.25.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="5254299780" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5742" name="Convert_449955" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5743" name="self.model.gpt_neox.layers.25.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="5304631428" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5744" name="Convert_449958" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5745" name="self.model.gpt_neox.layers.25.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5746" name="self.model.gpt_neox.layers.25.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="5304643716" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5747" name="self.model.gpt_neox.layers.25.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5748" name="self.model.gpt_neox.layers.25.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5749" name="__module.model.gpt_neox.layers.25.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5750" name="Constant_325443" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="5304668292" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5751" name="__module.model.gpt_neox.layers.25.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4047,qkv.101"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5752" name="__module.model.gpt_neox.layers.25.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5753" name="__module.model.gpt_neox.layers.25.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4051,qkv.103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="5754" name="Constant_303158" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5755" name="Constant_303161" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5756" name="Constant_303164" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5757" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4052"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5758" name="Constant_14747" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4053"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5759" name="__module.model.gpt_neox.layers.25.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4054,query.151"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5760" name="Constant_303170" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5761" name="Constant_303173" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5762" name="Constant_303176" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5763" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4061,q.51"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5764" name="self.model.gpt_neox.layers.25.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.25.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5765" name="__module.model.gpt_neox.layers.25.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5766" name="Constant_303182" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5767" name="Constant_303185" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5768" name="Constant_303188" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5769" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4055"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5770" name="ShapeOf_340184" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5771" name="Constant_341045" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5772" name="Constant_340186" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5773" name="Gather_340187" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4065"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5774" name="Constant_433288" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5775" name="Constant_433281" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5776" name="Constant_433283" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5777" name="Constant_433285" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5778" name="Concat_433286" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5779" name="Broadcast_433289" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5780" name="ReadValue_417354" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.25.keypresent.25.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.25.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5781" name="Constant_402040" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5782" name="Gather_402041" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5783" name="ShapeOf_340189" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5784" name="Constant_340190" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5785" name="Constant_340191" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5786" name="Gather_340192" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4067" /> + </output> + </layer> + <layer id="5787" name="Constant_337834" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5788" name="Reshape_340955" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5789" name="__module.model.gpt_neox.layers.25.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4066,4070,4071,seq_len.101"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5790" name="__module.model.gpt_neox.layers.25.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5791" name="__module.model.gpt_neox.layers.25.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4074,4077,cos.101"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5792" name="Constant_38377" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5793" name="__module.model.gpt_neox.layers.25.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4080"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5794" name="__module.model.gpt_neox.layers.25.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4081,cos.103"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5795" name="__module.model.gpt_neox.layers.25.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4085"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5796" name="Constant_303193" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5797" name="Constant_303192" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5798" name="__module.model.gpt_neox.layers.25.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5799" name="__module.model.gpt_neox.layers.25.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5800" name="__module.model.gpt_neox.layers.25.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4086,4091" /> + </output> + </layer> + <layer id="5801" name="__module.model.gpt_neox.layers.25.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5802" name="__module.model.gpt_neox.layers.25.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4088,4089,4093,4094" /> + </output> + </layer> + <layer id="5803" name="Constant_337836" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5804" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5805" name="Constant_303191" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5806" name="ScatterUpdate_303194" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5807" name="Constant_303197" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5808" name="Constant_303200" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5809" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4095,x2.101"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5810" name="Constant_325444" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5811" name="__module.model.gpt_neox.layers.25.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4096"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5812" name="Constant_303245" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5813" name="Constant_303250" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5814" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4090"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5815" name="__module.model.gpt_neox.layers.25.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4098"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5816" name="self.model.gpt_neox.layers.25.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.25.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5817" name="__module.model.gpt_neox.layers.25.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5818" name="__module.model.gpt_neox.layers.25.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5819" name="__module.model.gpt_neox.layers.25.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4075,4078,sin.101"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5820" name="Constant_38380" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5821" name="__module.model.gpt_neox.layers.25.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4083"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5822" name="__module.model.gpt_neox.layers.25.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4084,sin.103"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5823" name="__module.model.gpt_neox.layers.25.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4099"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5824" name="__module.model.gpt_neox.layers.25.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4100,4118,4128,query.153,query.155"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5825" name="Constant_14761" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4056"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5826" name="__module.model.gpt_neox.layers.25.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4057,key.151"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5827" name="Constant_303296" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5828" name="Constant_303299" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5829" name="Constant_303302" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5830" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4063,k.51"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5831" name="__module.model.gpt_neox.layers.25.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4101"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5832" name="Constant_303306" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5833" name="Constant_303305" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5834" name="__module.model.gpt_neox.layers.25.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5835" name="__module.model.gpt_neox.layers.25.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5836" name="__module.model.gpt_neox.layers.25.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4102,4107" /> + </output> + </layer> + <layer id="5837" name="__module.model.gpt_neox.layers.25.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5838" name="__module.model.gpt_neox.layers.25.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4104,4105,4109,4110" /> + </output> + </layer> + <layer id="5839" name="Constant_337838" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5840" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5841" name="Constant_303304" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5842" name="ScatterUpdate_303307" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5843" name="Constant_303310" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5844" name="Constant_303313" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5845" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4111,x2.103"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5846" name="Constant_325445" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5847" name="__module.model.gpt_neox.layers.25.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4112"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5848" name="Constant_303358" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5849" name="Constant_303363" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5850" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4106"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5851" name="__module.model.gpt_neox.layers.25.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4114"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5852" name="__module.model.gpt_neox.layers.25.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4115"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5853" name="__module.model.gpt_neox.layers.25.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4116,4120"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5854" name="__module.model.gpt_neox.layers.25.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.25.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5855" name="Constant_433301" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5856" name="Constant_433294" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5857" name="Constant_433296" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5858" name="Constant_433298" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5859" name="Concat_433299" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5860" name="Broadcast_433302" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5861" name="ReadValue_417356" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.25.valuepresent.25.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.25.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5862" name="Constant_402043" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5863" name="Gather_402044" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5864" name="Constant_303408" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5865" name="Constant_303411" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5866" name="Constant_303414" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5867" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4058"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5868" name="Constant_14775" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4059"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5869" name="__module.model.gpt_neox.layers.25.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4060"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5870" name="__module.model.gpt_neox.layers.25.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.25.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5871" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="4137"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5872" name="Constant_303418" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5873" name="Constant_303417" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5874" name="ShapeOf_340194" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5875" name="Constant_340195" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5876" name="Constant_340196" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5877" name="Gather_340197" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="5878" name="Add_340198" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4132" /> + </output> + </layer> + <layer id="5879" name="ShapeOf_340265" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5880" name="Constant_340266" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5881" name="Constant_340267" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5882" name="Gather_340268" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4130" /> + </output> + </layer> + <layer id="5883" name="__module.model.gpt_neox.layers.25.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4134,4135" /> + </output> + </layer> + <layer id="5884" name="Constant_337840" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5885" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5886" name="Constant_303416" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5887" name="ScatterUpdate_303419" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5888" name="Constant_303420" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5889" name="Constant_337842" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5890" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5891" name="ScatterUpdate_303421" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5892" name="Constant_303424" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5893" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4138"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="5894" name="Constant_303497" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5895" name="Constant_303498" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5896" name="Constant_303494" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5897" name="Constant_303493" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5898" name="ScatterUpdate_303499" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5899" name="Constant_303502" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5900" name="__module.model.gpt_neox.layers.25.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4139,4140"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5901" name="__module.model.gpt_neox.layers.25.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5902" name="__module.model.gpt_neox.layers.25.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="4127" /> + </output> + </layer> + <layer id="5903" name="__module.model.gpt_neox.layers.25.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="4141,causal_mask.101"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5904" name="Add_316788" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5905" name="ShapeOf_316789" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5906" name="Constant_340271" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5907" name="Constant_340272" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5908" name="Gather_340273" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4125"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5909" name="Constant_268211" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5910" name="Constant_268213" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5911" name="Constant_268215" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5912" name="__module.model.gpt_neox.layers.25.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4142"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5913" name="Maximum_316790" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5914" name="__module.model.gpt_neox.layers.25.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4144"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5915" name="__module.model.gpt_neox.layers.25.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4145,4146,sdpa_result.51,tensor.101"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5916" name="Constant_15216" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4147"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5917" name="__module.model.gpt_neox.layers.25.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4148"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5918" name="__module.model.gpt_neox.layers.25.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5919" name="__module.model.gpt_neox.layers.25.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4153"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5920" name="self.model.gpt_neox.layers.25.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="5304717444" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5921" name="Convert_449966" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5922" name="self.model.gpt_neox.layers.25.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5321494660" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5923" name="Convert_449969" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5924" name="self.model.gpt_neox.layers.25.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5925" name="self.model.gpt_neox.layers.25.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5321498756" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5926" name="self.model.gpt_neox.layers.25.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5927" name="self.model.gpt_neox.layers.25.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5928" name="__module.model.gpt_neox.layers.25.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5929" name="Constant_325446" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5321506948" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5930" name="__module.model.gpt_neox.layers.25.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4156,4158,input.103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5931" name="__module.model.gpt_neox.layers.25/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4162,attn_output.103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5932" name="__module.model.gpt_neox.layers.25.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5933" name="__module.model.gpt_neox.layers.25.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5934" name="Constant_325447" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5321523332" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5935" name="__module.model.gpt_neox.layers.25.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5936" name="Constant_325448" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5321539716" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5937" name="__module.model.gpt_neox.layers.25.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4166"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5938" name="self.model.gpt_neox.layers.25.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="5321556100" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5939" name="Convert_449977" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5940" name="self.model.gpt_neox.layers.25.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="5388664964" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5941" name="Convert_449980" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5942" name="self.model.gpt_neox.layers.25.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5943" name="self.model.gpt_neox.layers.25.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="5388681348" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5944" name="self.model.gpt_neox.layers.25.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5945" name="self.model.gpt_neox.layers.25.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5946" name="__module.model.gpt_neox.layers.25.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5947" name="Constant_325449" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="5388714116" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5948" name="__module.model.gpt_neox.layers.25.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4171"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5949" name="__module.model.gpt_neox.layers.25.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4172"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5950" name="self.model.gpt_neox.layers.25.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="5388779652" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5951" name="Convert_449988" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5952" name="self.model.gpt_neox.layers.25.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5455888516" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5953" name="Convert_449991" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5954" name="self.model.gpt_neox.layers.25.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5955" name="self.model.gpt_neox.layers.25.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5455892612" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5956" name="self.model.gpt_neox.layers.25.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5957" name="self.model.gpt_neox.layers.25.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="5958" name="__module.model.gpt_neox.layers.25.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5959" name="Constant_325450" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5455900804" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5960" name="__module.model.gpt_neox.layers.25.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4175,input.105"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5961" name="__module.model.gpt_neox.layers.25/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4177,4179,hidden_states.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5962" name="__module.model.gpt_neox.layers.26.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5963" name="__module.model.gpt_neox.layers.26.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5964" name="Constant_325451" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5455917188" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5965" name="__module.model.gpt_neox.layers.26.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5966" name="Constant_325452" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5455933572" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5967" name="__module.model.gpt_neox.layers.26.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4189"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5968" name="self.model.gpt_neox.layers.26.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="5455949956" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5969" name="Convert_449999" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5970" name="self.model.gpt_neox.layers.26.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="5506281604" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5971" name="Convert_450002" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5972" name="self.model.gpt_neox.layers.26.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5973" name="self.model.gpt_neox.layers.26.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="5506293892" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5974" name="self.model.gpt_neox.layers.26.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5975" name="self.model.gpt_neox.layers.26.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="5976" name="__module.model.gpt_neox.layers.26.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5977" name="Constant_325453" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="5506318468" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5978" name="__module.model.gpt_neox.layers.26.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4196,qkv.105"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="5979" name="__module.model.gpt_neox.layers.26.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5980" name="__module.model.gpt_neox.layers.26.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4200,qkv.107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="5981" name="Constant_303509" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5982" name="Constant_303512" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5983" name="Constant_303515" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5984" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4201"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5985" name="Constant_15328" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4202"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5986" name="__module.model.gpt_neox.layers.26.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4203,query.157"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5987" name="Constant_303521" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5988" name="Constant_303524" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5989" name="Constant_303527" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5990" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4210,q.53"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5991" name="self.model.gpt_neox.layers.26.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.26.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5992" name="__module.model.gpt_neox.layers.26.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5993" name="Constant_303533" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5994" name="Constant_303536" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5995" name="Constant_303539" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5996" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4204"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5997" name="ShapeOf_340275" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5998" name="Constant_341048" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5999" name="Constant_340277" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6000" name="Gather_340278" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4214"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6001" name="Constant_433314" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6002" name="Constant_433307" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6003" name="Constant_433309" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6004" name="Constant_433311" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6005" name="Concat_433312" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6006" name="Broadcast_433315" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6007" name="ReadValue_417358" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.26.keypresent.26.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.26.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6008" name="Constant_402046" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6009" name="Gather_402047" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6010" name="ShapeOf_340280" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6011" name="Constant_340281" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6012" name="Constant_340282" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6013" name="Gather_340283" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4216" /> + </output> + </layer> + <layer id="6014" name="Constant_337844" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6015" name="Reshape_340957" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6016" name="__module.model.gpt_neox.layers.26.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4215,4219,4220,seq_len.105"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6017" name="__module.model.gpt_neox.layers.26.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6018" name="__module.model.gpt_neox.layers.26.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4223,4226,cos.105"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6019" name="Constant_38383" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6020" name="__module.model.gpt_neox.layers.26.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4229"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6021" name="__module.model.gpt_neox.layers.26.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4230,cos.107"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6022" name="__module.model.gpt_neox.layers.26.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4234"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6023" name="Constant_303544" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6024" name="Constant_303543" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6025" name="__module.model.gpt_neox.layers.26.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6026" name="__module.model.gpt_neox.layers.26.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6027" name="__module.model.gpt_neox.layers.26.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4235,4240" /> + </output> + </layer> + <layer id="6028" name="__module.model.gpt_neox.layers.26.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6029" name="__module.model.gpt_neox.layers.26.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4237,4238,4242,4243" /> + </output> + </layer> + <layer id="6030" name="Constant_337846" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6031" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6032" name="Constant_303542" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6033" name="ScatterUpdate_303545" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6034" name="Constant_303548" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6035" name="Constant_303551" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6036" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4244,x2.105"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6037" name="Constant_325454" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6038" name="__module.model.gpt_neox.layers.26.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4245"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6039" name="Constant_303596" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6040" name="Constant_303601" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6041" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4239"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6042" name="__module.model.gpt_neox.layers.26.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4247"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6043" name="self.model.gpt_neox.layers.26.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.26.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6044" name="__module.model.gpt_neox.layers.26.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6045" name="__module.model.gpt_neox.layers.26.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6046" name="__module.model.gpt_neox.layers.26.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4224,4227,sin.105"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6047" name="Constant_38386" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6048" name="__module.model.gpt_neox.layers.26.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4232"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6049" name="__module.model.gpt_neox.layers.26.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4233,sin.107"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6050" name="__module.model.gpt_neox.layers.26.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4248"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6051" name="__module.model.gpt_neox.layers.26.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4249,4267,4277,query.159,query.161"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6052" name="Constant_15342" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4205"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6053" name="__module.model.gpt_neox.layers.26.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4206,key.157"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6054" name="Constant_303647" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6055" name="Constant_303650" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6056" name="Constant_303653" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6057" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4212,k.53"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6058" name="__module.model.gpt_neox.layers.26.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4250"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6059" name="Constant_303657" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6060" name="Constant_303656" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6061" name="__module.model.gpt_neox.layers.26.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6062" name="__module.model.gpt_neox.layers.26.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6063" name="__module.model.gpt_neox.layers.26.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4251,4256" /> + </output> + </layer> + <layer id="6064" name="__module.model.gpt_neox.layers.26.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6065" name="__module.model.gpt_neox.layers.26.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4253,4254,4258,4259" /> + </output> + </layer> + <layer id="6066" name="Constant_337848" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6067" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6068" name="Constant_303655" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6069" name="ScatterUpdate_303658" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6070" name="Constant_303661" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6071" name="Constant_303664" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6072" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4260,x2.107"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6073" name="Constant_325455" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6074" name="__module.model.gpt_neox.layers.26.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4261"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6075" name="Constant_303709" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6076" name="Constant_303714" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6077" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4255"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6078" name="__module.model.gpt_neox.layers.26.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4263"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6079" name="__module.model.gpt_neox.layers.26.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4264"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6080" name="__module.model.gpt_neox.layers.26.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4265,4269"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6081" name="__module.model.gpt_neox.layers.26.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.26.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6082" name="Constant_433327" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6083" name="Constant_433320" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6084" name="Constant_433322" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6085" name="Constant_433324" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6086" name="Concat_433325" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6087" name="Broadcast_433328" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6088" name="ReadValue_417360" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.26.valuepresent.26.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.26.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6089" name="Constant_402049" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6090" name="Gather_402050" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6091" name="Constant_303759" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6092" name="Constant_303762" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6093" name="Constant_303765" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6094" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4207"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6095" name="Constant_15356" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4208"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6096" name="__module.model.gpt_neox.layers.26.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4209"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6097" name="__module.model.gpt_neox.layers.26.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.26.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6098" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="4286"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6099" name="Constant_303769" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6100" name="Constant_303768" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6101" name="ShapeOf_340285" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6102" name="Constant_340286" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6103" name="Constant_340287" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6104" name="Gather_340288" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="6105" name="Add_340289" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4281" /> + </output> + </layer> + <layer id="6106" name="ShapeOf_340356" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6107" name="Constant_340357" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6108" name="Constant_340358" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6109" name="Gather_340359" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4279" /> + </output> + </layer> + <layer id="6110" name="__module.model.gpt_neox.layers.26.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4283,4284" /> + </output> + </layer> + <layer id="6111" name="Constant_337850" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6112" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6113" name="Constant_303767" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6114" name="ScatterUpdate_303770" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6115" name="Constant_303771" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6116" name="Constant_337852" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6117" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6118" name="ScatterUpdate_303772" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6119" name="Constant_303775" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6120" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4287"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6121" name="Constant_303848" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6122" name="Constant_303849" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6123" name="Constant_303845" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6124" name="Constant_303844" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6125" name="ScatterUpdate_303850" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6126" name="Constant_303853" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6127" name="__module.model.gpt_neox.layers.26.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4288,4289"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6128" name="__module.model.gpt_neox.layers.26.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6129" name="__module.model.gpt_neox.layers.26.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="4276" /> + </output> + </layer> + <layer id="6130" name="__module.model.gpt_neox.layers.26.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="4290,causal_mask.105"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6131" name="Add_316860" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6132" name="ShapeOf_316861" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6133" name="Constant_340362" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6134" name="Constant_340363" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6135" name="Gather_340364" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4274"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6136" name="Constant_268221" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6137" name="Constant_268223" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6138" name="Constant_268225" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6139" name="__module.model.gpt_neox.layers.26.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4291"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6140" name="Maximum_316862" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6141" name="__module.model.gpt_neox.layers.26.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4293"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6142" name="__module.model.gpt_neox.layers.26.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4294,4295,sdpa_result.53,tensor.105"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6143" name="Constant_15797" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4296"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6144" name="__module.model.gpt_neox.layers.26.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4297"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6145" name="__module.model.gpt_neox.layers.26.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6146" name="__module.model.gpt_neox.layers.26.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4302"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6147" name="self.model.gpt_neox.layers.26.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="5506367620" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6148" name="Convert_450010" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6149" name="self.model.gpt_neox.layers.26.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5523144836" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6150" name="Convert_450013" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6151" name="self.model.gpt_neox.layers.26.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6152" name="self.model.gpt_neox.layers.26.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5523148932" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6153" name="self.model.gpt_neox.layers.26.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6154" name="self.model.gpt_neox.layers.26.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6155" name="__module.model.gpt_neox.layers.26.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6156" name="Constant_325456" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5523157124" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6157" name="__module.model.gpt_neox.layers.26.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4305,4307,input.107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6158" name="__module.model.gpt_neox.layers.26/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4311,attn_output.107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6159" name="__module.model.gpt_neox.layers.26.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6160" name="__module.model.gpt_neox.layers.26.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6161" name="Constant_325457" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5523173508" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6162" name="__module.model.gpt_neox.layers.26.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6163" name="Constant_325458" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5523189892" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6164" name="__module.model.gpt_neox.layers.26.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4315"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6165" name="self.model.gpt_neox.layers.26.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="5523206276" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6166" name="Convert_450021" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6167" name="self.model.gpt_neox.layers.26.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="5590315140" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6168" name="Convert_450024" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6169" name="self.model.gpt_neox.layers.26.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6170" name="self.model.gpt_neox.layers.26.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="5590331524" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6171" name="self.model.gpt_neox.layers.26.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6172" name="self.model.gpt_neox.layers.26.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6173" name="__module.model.gpt_neox.layers.26.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6174" name="Constant_325459" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="5590364292" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6175" name="__module.model.gpt_neox.layers.26.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4320"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6176" name="__module.model.gpt_neox.layers.26.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4321"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6177" name="self.model.gpt_neox.layers.26.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="5590429828" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6178" name="Convert_450032" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6179" name="self.model.gpt_neox.layers.26.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5657538692" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6180" name="Convert_450035" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6181" name="self.model.gpt_neox.layers.26.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6182" name="self.model.gpt_neox.layers.26.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5657542788" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6183" name="self.model.gpt_neox.layers.26.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6184" name="self.model.gpt_neox.layers.26.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6185" name="__module.model.gpt_neox.layers.26.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6186" name="Constant_325460" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5657550980" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6187" name="__module.model.gpt_neox.layers.26.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4324,input.109"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6188" name="__module.model.gpt_neox.layers.26/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4326,4328,hidden_states.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6189" name="__module.model.gpt_neox.layers.27.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6190" name="__module.model.gpt_neox.layers.27.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6191" name="Constant_325461" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5657567364" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6192" name="__module.model.gpt_neox.layers.27.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6193" name="Constant_325462" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5657583748" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6194" name="__module.model.gpt_neox.layers.27.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4338"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6195" name="self.model.gpt_neox.layers.27.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="5657600132" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6196" name="Convert_450043" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6197" name="self.model.gpt_neox.layers.27.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="5707931780" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6198" name="Convert_450046" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6199" name="self.model.gpt_neox.layers.27.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6200" name="self.model.gpt_neox.layers.27.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="5707944068" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6201" name="self.model.gpt_neox.layers.27.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6202" name="self.model.gpt_neox.layers.27.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6203" name="__module.model.gpt_neox.layers.27.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6204" name="Constant_325463" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="5707968644" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6205" name="__module.model.gpt_neox.layers.27.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4345,qkv.109"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6206" name="__module.model.gpt_neox.layers.27.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6207" name="__module.model.gpt_neox.layers.27.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4349,qkv.111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="6208" name="Constant_303860" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6209" name="Constant_303863" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6210" name="Constant_303866" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6211" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4350"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6212" name="Constant_15909" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4351"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6213" name="__module.model.gpt_neox.layers.27.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4352,query.163"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6214" name="Constant_303872" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6215" name="Constant_303875" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6216" name="Constant_303878" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6217" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4359,q.55"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6218" name="self.model.gpt_neox.layers.27.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.27.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6219" name="__module.model.gpt_neox.layers.27.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6220" name="Constant_303884" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6221" name="Constant_303887" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6222" name="Constant_303890" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6223" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4353"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6224" name="ShapeOf_340366" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6225" name="Constant_341051" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6226" name="Constant_340368" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6227" name="Gather_340369" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4363"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6228" name="Constant_433340" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6229" name="Constant_433333" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6230" name="Constant_433335" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6231" name="Constant_433337" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6232" name="Concat_433338" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6233" name="Broadcast_433341" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6234" name="ReadValue_417362" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.27.keypresent.27.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.27.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6235" name="Constant_402052" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6236" name="Gather_402053" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6237" name="ShapeOf_340371" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6238" name="Constant_340372" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6239" name="Constant_340373" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6240" name="Gather_340374" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4365" /> + </output> + </layer> + <layer id="6241" name="Constant_337854" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6242" name="Reshape_340959" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6243" name="__module.model.gpt_neox.layers.27.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4364,4368,4369,seq_len.109"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6244" name="__module.model.gpt_neox.layers.27.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6245" name="__module.model.gpt_neox.layers.27.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4372,4375,cos.109"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6246" name="Constant_38389" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6247" name="__module.model.gpt_neox.layers.27.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4378"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6248" name="__module.model.gpt_neox.layers.27.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4379,cos.111"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6249" name="__module.model.gpt_neox.layers.27.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4383"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6250" name="Constant_303895" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6251" name="Constant_303894" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6252" name="__module.model.gpt_neox.layers.27.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6253" name="__module.model.gpt_neox.layers.27.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6254" name="__module.model.gpt_neox.layers.27.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4384,4389" /> + </output> + </layer> + <layer id="6255" name="__module.model.gpt_neox.layers.27.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6256" name="__module.model.gpt_neox.layers.27.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4386,4387,4391,4392" /> + </output> + </layer> + <layer id="6257" name="Constant_337856" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6258" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6259" name="Constant_303893" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6260" name="ScatterUpdate_303896" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6261" name="Constant_303899" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6262" name="Constant_303902" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6263" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4393,x2.109"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6264" name="Constant_325464" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6265" name="__module.model.gpt_neox.layers.27.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4394"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6266" name="Constant_303947" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6267" name="Constant_303952" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6268" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4388"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6269" name="__module.model.gpt_neox.layers.27.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4396"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6270" name="self.model.gpt_neox.layers.27.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.27.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6271" name="__module.model.gpt_neox.layers.27.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6272" name="__module.model.gpt_neox.layers.27.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6273" name="__module.model.gpt_neox.layers.27.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4373,4376,sin.109"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6274" name="Constant_38392" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6275" name="__module.model.gpt_neox.layers.27.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4381"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6276" name="__module.model.gpt_neox.layers.27.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4382,sin.111"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6277" name="__module.model.gpt_neox.layers.27.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4397"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6278" name="__module.model.gpt_neox.layers.27.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4398,4416,4426,query.165,query.167"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6279" name="Constant_15923" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4354"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6280" name="__module.model.gpt_neox.layers.27.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4355,key.163"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6281" name="Constant_303998" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6282" name="Constant_304001" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6283" name="Constant_304004" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6284" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4361,k.55"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6285" name="__module.model.gpt_neox.layers.27.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4399"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6286" name="Constant_304008" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6287" name="Constant_304007" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6288" name="__module.model.gpt_neox.layers.27.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6289" name="__module.model.gpt_neox.layers.27.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6290" name="__module.model.gpt_neox.layers.27.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4400,4405" /> + </output> + </layer> + <layer id="6291" name="__module.model.gpt_neox.layers.27.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6292" name="__module.model.gpt_neox.layers.27.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4402,4403,4407,4408" /> + </output> + </layer> + <layer id="6293" name="Constant_337858" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6294" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6295" name="Constant_304006" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6296" name="ScatterUpdate_304009" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6297" name="Constant_304012" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6298" name="Constant_304015" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6299" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4409,x2.111"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6300" name="Constant_325465" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6301" name="__module.model.gpt_neox.layers.27.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4410"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6302" name="Constant_304060" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6303" name="Constant_304065" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6304" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4404"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6305" name="__module.model.gpt_neox.layers.27.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4412"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6306" name="__module.model.gpt_neox.layers.27.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4413"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6307" name="__module.model.gpt_neox.layers.27.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4414,4418"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6308" name="__module.model.gpt_neox.layers.27.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.27.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6309" name="Constant_433353" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6310" name="Constant_433346" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6311" name="Constant_433348" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6312" name="Constant_433350" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6313" name="Concat_433351" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6314" name="Broadcast_433354" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6315" name="ReadValue_417364" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.27.valuepresent.27.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.27.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6316" name="Constant_402055" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6317" name="Gather_402056" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6318" name="Constant_304110" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6319" name="Constant_304113" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6320" name="Constant_304116" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6321" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4356"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6322" name="Constant_15937" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4357"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6323" name="__module.model.gpt_neox.layers.27.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4358"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6324" name="__module.model.gpt_neox.layers.27.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.27.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6325" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="4435"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6326" name="Constant_304120" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6327" name="Constant_304119" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6328" name="ShapeOf_340376" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6329" name="Constant_340377" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6330" name="Constant_340378" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6331" name="Gather_340379" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="6332" name="Add_340380" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4430" /> + </output> + </layer> + <layer id="6333" name="ShapeOf_340447" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6334" name="Constant_340448" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6335" name="Constant_340449" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6336" name="Gather_340450" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4428" /> + </output> + </layer> + <layer id="6337" name="__module.model.gpt_neox.layers.27.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4432,4433" /> + </output> + </layer> + <layer id="6338" name="Constant_337860" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6339" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6340" name="Constant_304118" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6341" name="ScatterUpdate_304121" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6342" name="Constant_304122" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6343" name="Constant_337862" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6344" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6345" name="ScatterUpdate_304123" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6346" name="Constant_304126" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6347" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4436"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6348" name="Constant_304199" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6349" name="Constant_304200" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6350" name="Constant_304196" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6351" name="Constant_304195" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6352" name="ScatterUpdate_304201" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6353" name="Constant_304204" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6354" name="__module.model.gpt_neox.layers.27.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4437,4438"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6355" name="__module.model.gpt_neox.layers.27.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6356" name="__module.model.gpt_neox.layers.27.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="4425" /> + </output> + </layer> + <layer id="6357" name="__module.model.gpt_neox.layers.27.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="4439,causal_mask.109"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6358" name="Add_316932" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6359" name="ShapeOf_316933" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6360" name="Constant_340453" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6361" name="Constant_340454" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6362" name="Gather_340455" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4423"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6363" name="Constant_268231" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6364" name="Constant_268233" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6365" name="Constant_268235" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6366" name="__module.model.gpt_neox.layers.27.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4440"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6367" name="Maximum_316934" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6368" name="__module.model.gpt_neox.layers.27.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4442"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6369" name="__module.model.gpt_neox.layers.27.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4443,4444,sdpa_result.55,tensor.109"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6370" name="Constant_16378" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4445"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6371" name="__module.model.gpt_neox.layers.27.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4446"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6372" name="__module.model.gpt_neox.layers.27.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6373" name="__module.model.gpt_neox.layers.27.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4451"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6374" name="self.model.gpt_neox.layers.27.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="5708017796" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6375" name="Convert_450054" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6376" name="self.model.gpt_neox.layers.27.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5724795012" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6377" name="Convert_450057" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6378" name="self.model.gpt_neox.layers.27.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6379" name="self.model.gpt_neox.layers.27.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5724799108" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6380" name="self.model.gpt_neox.layers.27.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6381" name="self.model.gpt_neox.layers.27.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6382" name="__module.model.gpt_neox.layers.27.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6383" name="Constant_325466" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5724807300" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6384" name="__module.model.gpt_neox.layers.27.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4454,4456,input.111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6385" name="__module.model.gpt_neox.layers.27/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4460,attn_output.111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6386" name="__module.model.gpt_neox.layers.27.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6387" name="__module.model.gpt_neox.layers.27.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6388" name="Constant_325467" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5724823684" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6389" name="__module.model.gpt_neox.layers.27.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6390" name="Constant_325468" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5724840068" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6391" name="__module.model.gpt_neox.layers.27.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4464"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6392" name="self.model.gpt_neox.layers.27.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="5724856452" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6393" name="Convert_450065" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6394" name="self.model.gpt_neox.layers.27.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="5791965316" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6395" name="Convert_450068" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6396" name="self.model.gpt_neox.layers.27.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6397" name="self.model.gpt_neox.layers.27.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="5791981700" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6398" name="self.model.gpt_neox.layers.27.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6399" name="self.model.gpt_neox.layers.27.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6400" name="__module.model.gpt_neox.layers.27.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6401" name="Constant_325469" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="5792014468" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6402" name="__module.model.gpt_neox.layers.27.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4469"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6403" name="__module.model.gpt_neox.layers.27.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4470"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6404" name="self.model.gpt_neox.layers.27.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="5792080004" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6405" name="Convert_450076" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6406" name="self.model.gpt_neox.layers.27.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5859188868" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6407" name="Convert_450079" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6408" name="self.model.gpt_neox.layers.27.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6409" name="self.model.gpt_neox.layers.27.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5859192964" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6410" name="self.model.gpt_neox.layers.27.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6411" name="self.model.gpt_neox.layers.27.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6412" name="__module.model.gpt_neox.layers.27.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6413" name="Constant_325470" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5859201156" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6414" name="__module.model.gpt_neox.layers.27.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4473,input.113"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6415" name="__module.model.gpt_neox.layers.27/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4475,4477,hidden_states.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6416" name="__module.model.gpt_neox.layers.28.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6417" name="__module.model.gpt_neox.layers.28.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6418" name="Constant_325471" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5859217540" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6419" name="__module.model.gpt_neox.layers.28.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6420" name="Constant_325472" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5859233924" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6421" name="__module.model.gpt_neox.layers.28.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4487"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6422" name="self.model.gpt_neox.layers.28.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="5859250308" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6423" name="Convert_450087" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6424" name="self.model.gpt_neox.layers.28.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="5909581956" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6425" name="Convert_450090" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6426" name="self.model.gpt_neox.layers.28.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6427" name="self.model.gpt_neox.layers.28.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="5909594244" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6428" name="self.model.gpt_neox.layers.28.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6429" name="self.model.gpt_neox.layers.28.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6430" name="__module.model.gpt_neox.layers.28.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6431" name="Constant_325473" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="5909618820" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6432" name="__module.model.gpt_neox.layers.28.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4494,qkv.113"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6433" name="__module.model.gpt_neox.layers.28.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6434" name="__module.model.gpt_neox.layers.28.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4498,qkv.115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="6435" name="Constant_304211" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6436" name="Constant_304214" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6437" name="Constant_304217" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6438" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4499"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6439" name="Constant_16490" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4500"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6440" name="__module.model.gpt_neox.layers.28.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4501,query.169"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6441" name="Constant_304223" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6442" name="Constant_304226" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6443" name="Constant_304229" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6444" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4508,q.57"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6445" name="self.model.gpt_neox.layers.28.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.28.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6446" name="__module.model.gpt_neox.layers.28.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6447" name="Constant_304235" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6448" name="Constant_304238" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6449" name="Constant_304241" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6450" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4502"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6451" name="ShapeOf_340457" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6452" name="Constant_341054" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6453" name="Constant_340459" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6454" name="Gather_340460" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4512"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6455" name="Constant_433366" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6456" name="Constant_433359" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6457" name="Constant_433361" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6458" name="Constant_433363" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6459" name="Concat_433364" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6460" name="Broadcast_433367" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6461" name="ReadValue_417366" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.28.keypresent.28.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.28.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6462" name="Constant_402058" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6463" name="Gather_402059" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6464" name="ShapeOf_340462" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6465" name="Constant_340463" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6466" name="Constant_340464" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6467" name="Gather_340465" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4514" /> + </output> + </layer> + <layer id="6468" name="Constant_337864" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6469" name="Reshape_340961" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6470" name="__module.model.gpt_neox.layers.28.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4513,4517,4518,seq_len.113"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6471" name="__module.model.gpt_neox.layers.28.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6472" name="__module.model.gpt_neox.layers.28.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4521,4524,cos.113"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6473" name="Constant_38395" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6474" name="__module.model.gpt_neox.layers.28.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4527"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6475" name="__module.model.gpt_neox.layers.28.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4528,cos.115"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6476" name="__module.model.gpt_neox.layers.28.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4532"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6477" name="Constant_304246" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6478" name="Constant_304245" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6479" name="__module.model.gpt_neox.layers.28.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6480" name="__module.model.gpt_neox.layers.28.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6481" name="__module.model.gpt_neox.layers.28.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4533,4538" /> + </output> + </layer> + <layer id="6482" name="__module.model.gpt_neox.layers.28.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6483" name="__module.model.gpt_neox.layers.28.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4535,4536,4540,4541" /> + </output> + </layer> + <layer id="6484" name="Constant_337866" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6485" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6486" name="Constant_304244" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6487" name="ScatterUpdate_304247" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6488" name="Constant_304250" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6489" name="Constant_304253" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6490" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4542,x2.113"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6491" name="Constant_325474" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6492" name="__module.model.gpt_neox.layers.28.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4543"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6493" name="Constant_304298" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6494" name="Constant_304303" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6495" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4537"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6496" name="__module.model.gpt_neox.layers.28.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4545"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6497" name="self.model.gpt_neox.layers.28.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.28.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6498" name="__module.model.gpt_neox.layers.28.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6499" name="__module.model.gpt_neox.layers.28.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6500" name="__module.model.gpt_neox.layers.28.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4522,4525,sin.113"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6501" name="Constant_38398" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6502" name="__module.model.gpt_neox.layers.28.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4530"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6503" name="__module.model.gpt_neox.layers.28.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4531,sin.115"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6504" name="__module.model.gpt_neox.layers.28.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4546"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6505" name="__module.model.gpt_neox.layers.28.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4547,4565,4575,query.171,query.173"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6506" name="Constant_16504" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4503"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6507" name="__module.model.gpt_neox.layers.28.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4504,key.169"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6508" name="Constant_304349" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6509" name="Constant_304352" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6510" name="Constant_304355" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6511" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4510,k.57"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6512" name="__module.model.gpt_neox.layers.28.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4548"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6513" name="Constant_304359" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6514" name="Constant_304358" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6515" name="__module.model.gpt_neox.layers.28.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6516" name="__module.model.gpt_neox.layers.28.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6517" name="__module.model.gpt_neox.layers.28.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4549,4554" /> + </output> + </layer> + <layer id="6518" name="__module.model.gpt_neox.layers.28.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6519" name="__module.model.gpt_neox.layers.28.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4551,4552,4556,4557" /> + </output> + </layer> + <layer id="6520" name="Constant_337868" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6521" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6522" name="Constant_304357" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6523" name="ScatterUpdate_304360" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6524" name="Constant_304363" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6525" name="Constant_304366" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6526" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4558,x2.115"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6527" name="Constant_325475" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6528" name="__module.model.gpt_neox.layers.28.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4559"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6529" name="Constant_304411" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6530" name="Constant_304416" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6531" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4553"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6532" name="__module.model.gpt_neox.layers.28.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4561"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6533" name="__module.model.gpt_neox.layers.28.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4562"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6534" name="__module.model.gpt_neox.layers.28.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4563,4567"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6535" name="__module.model.gpt_neox.layers.28.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.28.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6536" name="Constant_433379" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6537" name="Constant_433372" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6538" name="Constant_433374" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6539" name="Constant_433376" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6540" name="Concat_433377" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6541" name="Broadcast_433380" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6542" name="ReadValue_417368" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.28.valuepresent.28.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.28.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6543" name="Constant_402061" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6544" name="Gather_402062" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6545" name="Constant_304461" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6546" name="Constant_304464" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6547" name="Constant_304467" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6548" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4505"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6549" name="Constant_16518" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4506"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6550" name="__module.model.gpt_neox.layers.28.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4507"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6551" name="__module.model.gpt_neox.layers.28.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.28.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6552" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="4584"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6553" name="Constant_304471" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6554" name="Constant_304470" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6555" name="ShapeOf_340467" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6556" name="Constant_340468" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6557" name="Constant_340469" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6558" name="Gather_340470" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="6559" name="Add_340471" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4579" /> + </output> + </layer> + <layer id="6560" name="ShapeOf_340538" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6561" name="Constant_340539" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6562" name="Constant_340540" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6563" name="Gather_340541" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4577" /> + </output> + </layer> + <layer id="6564" name="__module.model.gpt_neox.layers.28.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4581,4582" /> + </output> + </layer> + <layer id="6565" name="Constant_337870" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6566" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6567" name="Constant_304469" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6568" name="ScatterUpdate_304472" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6569" name="Constant_304473" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6570" name="Constant_337872" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6571" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6572" name="ScatterUpdate_304474" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6573" name="Constant_304477" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6574" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4585"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6575" name="Constant_304550" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6576" name="Constant_304551" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6577" name="Constant_304547" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6578" name="Constant_304546" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6579" name="ScatterUpdate_304552" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6580" name="Constant_304555" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6581" name="__module.model.gpt_neox.layers.28.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4586,4587"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6582" name="__module.model.gpt_neox.layers.28.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6583" name="__module.model.gpt_neox.layers.28.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="4574" /> + </output> + </layer> + <layer id="6584" name="__module.model.gpt_neox.layers.28.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="4588,causal_mask.113"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6585" name="Add_317004" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6586" name="ShapeOf_317005" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6587" name="Constant_340544" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6588" name="Constant_340545" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6589" name="Gather_340546" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4572"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6590" name="Constant_268241" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6591" name="Constant_268243" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6592" name="Constant_268245" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6593" name="__module.model.gpt_neox.layers.28.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4589"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6594" name="Maximum_317006" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6595" name="__module.model.gpt_neox.layers.28.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4591"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6596" name="__module.model.gpt_neox.layers.28.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4592,4593,sdpa_result.57,tensor.113"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6597" name="Constant_16959" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4594"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6598" name="__module.model.gpt_neox.layers.28.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4595"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6599" name="__module.model.gpt_neox.layers.28.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6600" name="__module.model.gpt_neox.layers.28.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4600"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6601" name="self.model.gpt_neox.layers.28.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="5909667972" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6602" name="Convert_450098" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6603" name="self.model.gpt_neox.layers.28.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="5926445188" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6604" name="Convert_450101" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6605" name="self.model.gpt_neox.layers.28.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6606" name="self.model.gpt_neox.layers.28.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="5926449284" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6607" name="self.model.gpt_neox.layers.28.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6608" name="self.model.gpt_neox.layers.28.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6609" name="__module.model.gpt_neox.layers.28.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6610" name="Constant_325476" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5926457476" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6611" name="__module.model.gpt_neox.layers.28.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4603,4605,input.115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6612" name="__module.model.gpt_neox.layers.28/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4609,attn_output.115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6613" name="__module.model.gpt_neox.layers.28.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6614" name="__module.model.gpt_neox.layers.28.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6615" name="Constant_325477" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5926473860" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6616" name="__module.model.gpt_neox.layers.28.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6617" name="Constant_325478" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="5926490244" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6618" name="__module.model.gpt_neox.layers.28.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4613"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6619" name="self.model.gpt_neox.layers.28.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="5926506628" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6620" name="Convert_450109" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6621" name="self.model.gpt_neox.layers.28.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="5993615492" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6622" name="Convert_450112" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6623" name="self.model.gpt_neox.layers.28.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6624" name="self.model.gpt_neox.layers.28.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="5993631876" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6625" name="self.model.gpt_neox.layers.28.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6626" name="self.model.gpt_neox.layers.28.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6627" name="__module.model.gpt_neox.layers.28.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6628" name="Constant_325479" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="5993664644" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6629" name="__module.model.gpt_neox.layers.28.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4618"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6630" name="__module.model.gpt_neox.layers.28.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4619"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6631" name="self.model.gpt_neox.layers.28.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="5993730180" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6632" name="Convert_450120" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6633" name="self.model.gpt_neox.layers.28.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="6060839044" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6634" name="Convert_450123" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6635" name="self.model.gpt_neox.layers.28.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6636" name="self.model.gpt_neox.layers.28.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="6060843140" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6637" name="self.model.gpt_neox.layers.28.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6638" name="self.model.gpt_neox.layers.28.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6639" name="__module.model.gpt_neox.layers.28.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6640" name="Constant_325480" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6060851332" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6641" name="__module.model.gpt_neox.layers.28.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4622,input.117"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6642" name="__module.model.gpt_neox.layers.28/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4624,4626,hidden_states.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6643" name="__module.model.gpt_neox.layers.29.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6644" name="__module.model.gpt_neox.layers.29.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6645" name="Constant_325481" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6060867716" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6646" name="__module.model.gpt_neox.layers.29.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6647" name="Constant_325482" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6060884100" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6648" name="__module.model.gpt_neox.layers.29.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4636"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6649" name="self.model.gpt_neox.layers.29.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="6060900484" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6650" name="Convert_450131" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6651" name="self.model.gpt_neox.layers.29.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="6111232132" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6652" name="Convert_450134" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6653" name="self.model.gpt_neox.layers.29.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6654" name="self.model.gpt_neox.layers.29.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="6111244420" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6655" name="self.model.gpt_neox.layers.29.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6656" name="self.model.gpt_neox.layers.29.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6657" name="__module.model.gpt_neox.layers.29.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6658" name="Constant_325483" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="6111268996" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6659" name="__module.model.gpt_neox.layers.29.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4643,qkv.117"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6660" name="__module.model.gpt_neox.layers.29.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6661" name="__module.model.gpt_neox.layers.29.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4647,qkv.119"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="6662" name="Constant_304562" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6663" name="Constant_304565" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6664" name="Constant_304568" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6665" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4648"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6666" name="Constant_17071" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4649"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6667" name="__module.model.gpt_neox.layers.29.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4650,query.175"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6668" name="Constant_304574" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6669" name="Constant_304577" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6670" name="Constant_304580" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6671" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4657,q.59"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6672" name="self.model.gpt_neox.layers.29.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.29.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6673" name="__module.model.gpt_neox.layers.29.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6674" name="Constant_304586" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6675" name="Constant_304589" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6676" name="Constant_304592" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6677" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4651"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6678" name="ShapeOf_340548" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6679" name="Constant_341057" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6680" name="Constant_340550" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6681" name="Gather_340551" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4661"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6682" name="Constant_433392" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6683" name="Constant_433385" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6684" name="Constant_433387" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6685" name="Constant_433389" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6686" name="Concat_433390" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6687" name="Broadcast_433393" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6688" name="ReadValue_417370" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.29.keypresent.29.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.29.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6689" name="Constant_402064" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6690" name="Gather_402065" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6691" name="ShapeOf_340553" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6692" name="Constant_340554" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6693" name="Constant_340555" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6694" name="Gather_340556" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4663" /> + </output> + </layer> + <layer id="6695" name="Constant_337874" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6696" name="Reshape_340963" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6697" name="__module.model.gpt_neox.layers.29.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4662,4666,4667,seq_len.117"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6698" name="__module.model.gpt_neox.layers.29.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6699" name="__module.model.gpt_neox.layers.29.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4670,4673,cos.117"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6700" name="Constant_38401" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6701" name="__module.model.gpt_neox.layers.29.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4676"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6702" name="__module.model.gpt_neox.layers.29.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4677,cos.119"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6703" name="__module.model.gpt_neox.layers.29.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4681"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6704" name="Constant_304597" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6705" name="Constant_304596" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6706" name="__module.model.gpt_neox.layers.29.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6707" name="__module.model.gpt_neox.layers.29.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6708" name="__module.model.gpt_neox.layers.29.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4682,4687" /> + </output> + </layer> + <layer id="6709" name="__module.model.gpt_neox.layers.29.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6710" name="__module.model.gpt_neox.layers.29.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4684,4685,4689,4690" /> + </output> + </layer> + <layer id="6711" name="Constant_337876" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6712" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6713" name="Constant_304595" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6714" name="ScatterUpdate_304598" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6715" name="Constant_304601" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6716" name="Constant_304604" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6717" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4691,x2.117"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6718" name="Constant_325484" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6719" name="__module.model.gpt_neox.layers.29.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4692"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6720" name="Constant_304649" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6721" name="Constant_304654" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6722" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4686"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6723" name="__module.model.gpt_neox.layers.29.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4694"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6724" name="self.model.gpt_neox.layers.29.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.29.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6725" name="__module.model.gpt_neox.layers.29.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6726" name="__module.model.gpt_neox.layers.29.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6727" name="__module.model.gpt_neox.layers.29.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4671,4674,sin.117"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6728" name="Constant_38404" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6729" name="__module.model.gpt_neox.layers.29.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4679"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6730" name="__module.model.gpt_neox.layers.29.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4680,sin.119"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6731" name="__module.model.gpt_neox.layers.29.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4695"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6732" name="__module.model.gpt_neox.layers.29.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4696,4714,4724,query.177,query.179"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6733" name="Constant_17085" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4652"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6734" name="__module.model.gpt_neox.layers.29.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4653,key.175"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6735" name="Constant_304700" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6736" name="Constant_304703" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6737" name="Constant_304706" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6738" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4659,k.59"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6739" name="__module.model.gpt_neox.layers.29.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4697"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6740" name="Constant_304710" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6741" name="Constant_304709" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6742" name="__module.model.gpt_neox.layers.29.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6743" name="__module.model.gpt_neox.layers.29.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6744" name="__module.model.gpt_neox.layers.29.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4698,4703" /> + </output> + </layer> + <layer id="6745" name="__module.model.gpt_neox.layers.29.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6746" name="__module.model.gpt_neox.layers.29.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4700,4701,4705,4706" /> + </output> + </layer> + <layer id="6747" name="Constant_337878" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6748" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6749" name="Constant_304708" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6750" name="ScatterUpdate_304711" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6751" name="Constant_304714" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6752" name="Constant_304717" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6753" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4707,x2.119"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6754" name="Constant_325485" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6755" name="__module.model.gpt_neox.layers.29.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4708"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6756" name="Constant_304762" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6757" name="Constant_304767" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6758" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4702"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6759" name="__module.model.gpt_neox.layers.29.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4710"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6760" name="__module.model.gpt_neox.layers.29.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4711"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6761" name="__module.model.gpt_neox.layers.29.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4712,4716"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6762" name="__module.model.gpt_neox.layers.29.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.29.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6763" name="Constant_433405" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6764" name="Constant_433398" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6765" name="Constant_433400" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6766" name="Constant_433402" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6767" name="Concat_433403" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6768" name="Broadcast_433406" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6769" name="ReadValue_417372" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.29.valuepresent.29.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.29.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6770" name="Constant_402067" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6771" name="Gather_402068" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6772" name="Constant_304812" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6773" name="Constant_304815" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6774" name="Constant_304818" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6775" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4654"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6776" name="Constant_17099" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4655"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6777" name="__module.model.gpt_neox.layers.29.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4656"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6778" name="__module.model.gpt_neox.layers.29.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.29.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6779" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="4733"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6780" name="Constant_304822" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6781" name="Constant_304821" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6782" name="ShapeOf_340558" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6783" name="Constant_340559" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6784" name="Constant_340560" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6785" name="Gather_340561" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="6786" name="Add_340562" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4728" /> + </output> + </layer> + <layer id="6787" name="ShapeOf_340629" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6788" name="Constant_340630" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6789" name="Constant_340631" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6790" name="Gather_340632" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4726" /> + </output> + </layer> + <layer id="6791" name="__module.model.gpt_neox.layers.29.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4730,4731" /> + </output> + </layer> + <layer id="6792" name="Constant_337880" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6793" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6794" name="Constant_304820" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6795" name="ScatterUpdate_304823" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6796" name="Constant_304824" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6797" name="Constant_337882" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6798" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6799" name="ScatterUpdate_304825" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6800" name="Constant_304828" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6801" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4734"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="6802" name="Constant_304901" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6803" name="Constant_304902" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6804" name="Constant_304898" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6805" name="Constant_304897" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6806" name="ScatterUpdate_304903" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6807" name="Constant_304906" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6808" name="__module.model.gpt_neox.layers.29.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4735,4736"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6809" name="__module.model.gpt_neox.layers.29.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6810" name="__module.model.gpt_neox.layers.29.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="4723" /> + </output> + </layer> + <layer id="6811" name="__module.model.gpt_neox.layers.29.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="4737,causal_mask.117"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6812" name="Add_317076" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6813" name="ShapeOf_317077" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6814" name="Constant_340635" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6815" name="Constant_340636" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6816" name="Gather_340637" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4721"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6817" name="Constant_268251" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6818" name="Constant_268253" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6819" name="Constant_268255" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6820" name="__module.model.gpt_neox.layers.29.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4738"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6821" name="Maximum_317078" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6822" name="__module.model.gpt_neox.layers.29.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4740"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6823" name="__module.model.gpt_neox.layers.29.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4741,4742,sdpa_result.59,tensor.117"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6824" name="Constant_17540" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4743"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6825" name="__module.model.gpt_neox.layers.29.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4744"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6826" name="__module.model.gpt_neox.layers.29.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6827" name="__module.model.gpt_neox.layers.29.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4749"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6828" name="self.model.gpt_neox.layers.29.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="6111318148" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6829" name="Convert_450142" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6830" name="self.model.gpt_neox.layers.29.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="6128095364" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6831" name="Convert_450145" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6832" name="self.model.gpt_neox.layers.29.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6833" name="self.model.gpt_neox.layers.29.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="6128099460" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6834" name="self.model.gpt_neox.layers.29.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6835" name="self.model.gpt_neox.layers.29.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6836" name="__module.model.gpt_neox.layers.29.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6837" name="Constant_325486" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6128107652" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6838" name="__module.model.gpt_neox.layers.29.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4752,4754,input.119"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6839" name="__module.model.gpt_neox.layers.29/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4758,attn_output.119"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6840" name="__module.model.gpt_neox.layers.29.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6841" name="__module.model.gpt_neox.layers.29.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6842" name="Constant_325487" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6128124036" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6843" name="__module.model.gpt_neox.layers.29.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6844" name="Constant_325488" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6128140420" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6845" name="__module.model.gpt_neox.layers.29.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4762"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6846" name="self.model.gpt_neox.layers.29.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="6128156804" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6847" name="Convert_450153" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6848" name="self.model.gpt_neox.layers.29.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="6195265668" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6849" name="Convert_450156" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6850" name="self.model.gpt_neox.layers.29.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6851" name="self.model.gpt_neox.layers.29.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="6195282052" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6852" name="self.model.gpt_neox.layers.29.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6853" name="self.model.gpt_neox.layers.29.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6854" name="__module.model.gpt_neox.layers.29.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6855" name="Constant_325489" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="6195314820" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6856" name="__module.model.gpt_neox.layers.29.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4767"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6857" name="__module.model.gpt_neox.layers.29.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4768"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6858" name="self.model.gpt_neox.layers.29.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="6195380356" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6859" name="Convert_450164" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6860" name="self.model.gpt_neox.layers.29.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="6262489220" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6861" name="Convert_450167" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6862" name="self.model.gpt_neox.layers.29.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6863" name="self.model.gpt_neox.layers.29.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="6262493316" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6864" name="self.model.gpt_neox.layers.29.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6865" name="self.model.gpt_neox.layers.29.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="6866" name="__module.model.gpt_neox.layers.29.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6867" name="Constant_325490" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6262501508" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6868" name="__module.model.gpt_neox.layers.29.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4771,input.121"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6869" name="__module.model.gpt_neox.layers.29/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4773,4775,hidden_states.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6870" name="__module.model.gpt_neox.layers.30.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6871" name="__module.model.gpt_neox.layers.30.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6872" name="Constant_325491" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6262517892" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6873" name="__module.model.gpt_neox.layers.30.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6874" name="Constant_325492" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6262534276" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6875" name="__module.model.gpt_neox.layers.30.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4785"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6876" name="self.model.gpt_neox.layers.30.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="6262550660" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6877" name="Convert_450175" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6878" name="self.model.gpt_neox.layers.30.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="6312882308" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6879" name="Convert_450178" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6880" name="self.model.gpt_neox.layers.30.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6881" name="self.model.gpt_neox.layers.30.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="6312894596" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6882" name="self.model.gpt_neox.layers.30.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6883" name="self.model.gpt_neox.layers.30.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="6884" name="__module.model.gpt_neox.layers.30.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6885" name="Constant_325493" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="6312919172" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6886" name="__module.model.gpt_neox.layers.30.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4792,qkv.121"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="6887" name="__module.model.gpt_neox.layers.30.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6888" name="__module.model.gpt_neox.layers.30.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4796,qkv.123"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="6889" name="Constant_304913" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6890" name="Constant_304916" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6891" name="Constant_304919" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6892" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4797"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6893" name="Constant_17652" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4798"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6894" name="__module.model.gpt_neox.layers.30.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4799,query.181"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6895" name="Constant_304925" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6896" name="Constant_304928" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6897" name="Constant_304931" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6898" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4806,q.61"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6899" name="self.model.gpt_neox.layers.30.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.30.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6900" name="__module.model.gpt_neox.layers.30.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6901" name="Constant_304937" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6902" name="Constant_304940" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6903" name="Constant_304943" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6904" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4800"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6905" name="ShapeOf_340639" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6906" name="Constant_341060" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6907" name="Constant_340641" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6908" name="Gather_340642" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4810"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6909" name="Constant_433418" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6910" name="Constant_433411" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6911" name="Constant_433413" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6912" name="Constant_433415" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6913" name="Concat_433416" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6914" name="Broadcast_433419" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6915" name="ReadValue_417378" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.30.keypresent.30.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.30.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6916" name="Constant_402070" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6917" name="Gather_402071" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6918" name="ShapeOf_340644" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6919" name="Constant_340645" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6920" name="Constant_340646" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6921" name="Gather_340647" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4812" /> + </output> + </layer> + <layer id="6922" name="Constant_337884" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6923" name="Reshape_340965" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6924" name="__module.model.gpt_neox.layers.30.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4811,4815,4816,seq_len.121"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6925" name="__module.model.gpt_neox.layers.30.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6926" name="__module.model.gpt_neox.layers.30.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4819,4822,cos.121"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6927" name="Constant_38407" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6928" name="__module.model.gpt_neox.layers.30.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4825"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6929" name="__module.model.gpt_neox.layers.30.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4826,cos.123"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6930" name="__module.model.gpt_neox.layers.30.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4830"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6931" name="Constant_304948" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6932" name="Constant_304947" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6933" name="__module.model.gpt_neox.layers.30.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6934" name="__module.model.gpt_neox.layers.30.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6935" name="__module.model.gpt_neox.layers.30.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4831,4836" /> + </output> + </layer> + <layer id="6936" name="__module.model.gpt_neox.layers.30.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6937" name="__module.model.gpt_neox.layers.30.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4833,4834,4838,4839" /> + </output> + </layer> + <layer id="6938" name="Constant_337886" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6939" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6940" name="Constant_304946" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6941" name="ScatterUpdate_304949" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6942" name="Constant_304952" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6943" name="Constant_304955" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6944" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4840,x2.121"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6945" name="Constant_325494" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6946" name="__module.model.gpt_neox.layers.30.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4841"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6947" name="Constant_305000" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6948" name="Constant_305005" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6949" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4835"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6950" name="__module.model.gpt_neox.layers.30.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4843"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6951" name="self.model.gpt_neox.layers.30.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.30.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6952" name="__module.model.gpt_neox.layers.30.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6953" name="__module.model.gpt_neox.layers.30.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6954" name="__module.model.gpt_neox.layers.30.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4820,4823,sin.121"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6955" name="Constant_38410" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6956" name="__module.model.gpt_neox.layers.30.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4828"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6957" name="__module.model.gpt_neox.layers.30.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4829,sin.123"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6958" name="__module.model.gpt_neox.layers.30.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4844"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6959" name="__module.model.gpt_neox.layers.30.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4845,4863,4873,query.183,query.185"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6960" name="Constant_17666" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4801"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6961" name="__module.model.gpt_neox.layers.30.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4802,key.181"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6962" name="Constant_305051" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6963" name="Constant_305054" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6964" name="Constant_305057" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6965" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4808,k.61"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6966" name="__module.model.gpt_neox.layers.30.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4846"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6967" name="Constant_305061" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6968" name="Constant_305060" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6969" name="__module.model.gpt_neox.layers.30.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6970" name="__module.model.gpt_neox.layers.30.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6971" name="__module.model.gpt_neox.layers.30.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4847,4852" /> + </output> + </layer> + <layer id="6972" name="__module.model.gpt_neox.layers.30.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6973" name="__module.model.gpt_neox.layers.30.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4849,4850,4854,4855" /> + </output> + </layer> + <layer id="6974" name="Constant_337888" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6975" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Unsqueeze_33" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6976" name="Constant_305059" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6977" name="ScatterUpdate_305062" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6978" name="Constant_305065" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6979" name="Constant_305068" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6980" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4856,x2.123"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6981" name="Constant_325495" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6982" name="__module.model.gpt_neox.layers.30.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4857"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6983" name="Constant_305113" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6984" name="Constant_305118" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6985" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4851"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6986" name="__module.model.gpt_neox.layers.30.attention/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4859"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6987" name="__module.model.gpt_neox.layers.30.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4860"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6988" name="__module.model.gpt_neox.layers.30.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4861,4865"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6989" name="__module.model.gpt_neox.layers.30.attention/aten::to/Convert_1" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.30.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6990" name="Constant_433431" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6991" name="Constant_433424" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6992" name="Constant_433426" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6993" name="Constant_433428" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6994" name="Concat_433429" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6995" name="Broadcast_433432" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6996" name="ReadValue_417380" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.30.valuepresent.30.value" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.30.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6997" name="Constant_402073" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6998" name="Gather_402074" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6999" name="Constant_305163" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7000" name="Constant_305166" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7001" name="Constant_305169" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7002" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_10" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4803"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7003" name="Constant_17680" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4804"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7004" name="__module.model.gpt_neox.layers.30.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4805"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7005" name="__module.model.gpt_neox.layers.30.attention/aten::cat/Concat_5" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.30.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7006" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="4882"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="7007" name="Constant_305173" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7008" name="Constant_305172" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7009" name="ShapeOf_340649" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7010" name="Constant_340650" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7011" name="Constant_340651" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7012" name="Gather_340652" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="7013" name="Add_340653" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4877" /> + </output> + </layer> + <layer id="7014" name="ShapeOf_340720" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7015" name="Constant_340721" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7016" name="Constant_340722" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7017" name="Gather_340723" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4875" /> + </output> + </layer> + <layer id="7018" name="__module.model.gpt_neox.layers.30.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="4879,4880" /> + </output> + </layer> + <layer id="7019" name="Constant_337890" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7020" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7021" name="Constant_305171" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7022" name="ScatterUpdate_305174" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7023" name="Constant_305175" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7024" name="Constant_337892" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7025" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7026" name="ScatterUpdate_305176" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7027" name="Constant_305179" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7028" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4883"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="7029" name="Constant_305252" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7030" name="Constant_305253" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7031" name="Constant_305249" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7032" name="Constant_305248" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7033" name="ScatterUpdate_305254" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7034" name="Constant_305257" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7035" name="__module.model.gpt_neox.layers.30.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="4884,4885"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7036" name="__module.model.gpt_neox.layers.30.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7037" name="__module.model.gpt_neox.layers.30.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="4872" /> + </output> + </layer> + <layer id="7038" name="__module.model.gpt_neox.layers.30.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="4886,causal_mask.121"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7039" name="Add_317148" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7040" name="ShapeOf_317149" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7041" name="Constant_340726" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7042" name="Constant_340727" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7043" name="Gather_340728" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4870"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7044" name="Constant_268261" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7045" name="Constant_268263" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7046" name="Constant_268265" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7047" name="__module.model.gpt_neox.layers.30.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4887"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7048" name="Maximum_317150" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7049" name="__module.model.gpt_neox.layers.30.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4889"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7050" name="__module.model.gpt_neox.layers.30.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4890,4891,sdpa_result.61,tensor.121"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7051" name="Constant_18121" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4892"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7052" name="__module.model.gpt_neox.layers.30.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4893"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7053" name="__module.model.gpt_neox.layers.30.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7054" name="__module.model.gpt_neox.layers.30.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4898"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7055" name="self.model.gpt_neox.layers.30.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="6312968324" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7056" name="Convert_450186" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7057" name="self.model.gpt_neox.layers.30.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="6329745540" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7058" name="Convert_450189" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7059" name="self.model.gpt_neox.layers.30.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7060" name="self.model.gpt_neox.layers.30.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="6329749636" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7061" name="self.model.gpt_neox.layers.30.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7062" name="self.model.gpt_neox.layers.30.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7063" name="__module.model.gpt_neox.layers.30.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7064" name="Constant_325496" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6329757828" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7065" name="__module.model.gpt_neox.layers.30.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4901,4903,input.123"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7066" name="__module.model.gpt_neox.layers.30/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4907,attn_output.123"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7067" name="__module.model.gpt_neox.layers.30.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7068" name="__module.model.gpt_neox.layers.30.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7069" name="Constant_325497" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6329774212" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7070" name="__module.model.gpt_neox.layers.30.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7071" name="Constant_325498" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6329790596" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7072" name="__module.model.gpt_neox.layers.30.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4911"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7073" name="self.model.gpt_neox.layers.30.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="6329806980" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7074" name="Convert_450197" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7075" name="self.model.gpt_neox.layers.30.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="6396915844" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7076" name="Convert_450200" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7077" name="self.model.gpt_neox.layers.30.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7078" name="self.model.gpt_neox.layers.30.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="6396932228" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7079" name="self.model.gpt_neox.layers.30.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7080" name="self.model.gpt_neox.layers.30.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7081" name="__module.model.gpt_neox.layers.30.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7082" name="Constant_325499" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="6396964996" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7083" name="__module.model.gpt_neox.layers.30.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4916"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7084" name="__module.model.gpt_neox.layers.30.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4917"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7085" name="self.model.gpt_neox.layers.30.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="6397030532" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7086" name="Convert_450208" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7087" name="self.model.gpt_neox.layers.30.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="6464139396" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7088" name="Convert_450211" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7089" name="self.model.gpt_neox.layers.30.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7090" name="self.model.gpt_neox.layers.30.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="6464143492" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7091" name="self.model.gpt_neox.layers.30.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7092" name="self.model.gpt_neox.layers.30.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7093" name="__module.model.gpt_neox.layers.30.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7094" name="Constant_325500" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6464151684" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7095" name="__module.model.gpt_neox.layers.30.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4920,input.125"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7096" name="__module.model.gpt_neox.layers.30/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4922,4924,hidden_states"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7097" name="__module.model.gpt_neox.layers.31.input_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7098" name="__module.model.gpt_neox.layers.31.input_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7099" name="Constant_325501" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6464168068" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7100" name="__module.model.gpt_neox.layers.31.input_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7101" name="Constant_325502" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6464184452" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7102" name="__module.model.gpt_neox.layers.31.input_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4934"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7103" name="self.model.gpt_neox.layers.31.attention.query_key_value.weight" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 4096" offset="6464200836" size="50331648" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7104" name="Convert_450219" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7105" name="self.model.gpt_neox.layers.31.attention.query_key_value.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="12288, 1" offset="6514532484" size="12288" /> + <output> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7106" name="Convert_450222" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7107" name="self.model.gpt_neox.layers.31.attention.query_key_value.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7108" name="self.model.gpt_neox.layers.31.attention.query_key_value.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="12288, 1" offset="6514544772" size="24576" /> + <output> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7109" name="self.model.gpt_neox.layers.31.attention.query_key_value.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>12288</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7110" name="self.model.gpt_neox.layers.31.attention.query_key_value.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7111" name="__module.model.gpt_neox.layers.31.attention.query_key_value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>12288</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="7112" name="Constant_325503" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 12288" offset="6514569348" size="49152" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="7113" name="__module.model.gpt_neox.layers.31.attention.query_key_value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>12288</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4941,qkv.125"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + </output> + </layer> + <layer id="7114" name="__module.model.gpt_neox.layers.31.attention/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171232" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7115" name="__module.model.gpt_neox.layers.31.attention/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12288</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4945,qkv"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + </output> + </layer> + <layer id="7116" name="Constant_305264" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7117" name="Constant_305267" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7118" name="Constant_305270" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7119" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4952"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7120" name="Constant_18261" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4953"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7121" name="__module.model.gpt_neox.layers.31.attention/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4954"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7122" name="__module.model.gpt_neox.layers.31.attention/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.31.value"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7124" name="Constant_433444" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7125" name="Constant_433437" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7126" name="Constant_433439" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7127" name="Constant_433441" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7128" name="Concat_433442" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7129" name="Broadcast_433445" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7130" name="ReadValue_417382" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.31.keypresent.31.key" variable_type="f32" variable_shape="?,32,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.31.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7131" name="Constant_402076" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7132" name="Gather_402077" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7133" name="Constant_305276" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7134" name="Constant_305279" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258219968" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7135" name="Constant_305282" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7136" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4949"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7137" name="Constant_18247" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4950"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7138" name="__module.model.gpt_neox.layers.31.attention/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4951,key.187"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7139" name="Constant_305288" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7140" name="Constant_305291" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7141" name="Constant_305294" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7142" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_2" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4957,k"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7143" name="self.model.gpt_neox.layers.31.attention.rotary_emb.cos_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="257171392" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.31.attention.rotary_emb.cos_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7144" name="__module.model.gpt_neox.layers.31.attention.rotary_emb/aten::slice/Unsqueeze" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7145" name="ShapeOf_340730" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7146" name="Constant_341063" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7147" name="Constant_340732" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7148" name="Gather_340733" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4959"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7149" name="ShapeOf_340735" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7150" name="Constant_341066" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7151" name="Constant_340737" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7152" name="Gather_340738" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="4961"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7153" name="__module.model.gpt_neox.layers.31.attention/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4960,4964,4965,seq_len.125"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7154" name="__module.model.gpt_neox.layers.31.attention.rotary_emb/aten::slice/Unsqueeze_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7155" name="__module.model.gpt_neox.layers.31.attention.rotary_emb/aten::slice/Slice" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4968,4971,cos.125"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7156" name="Constant_38413" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7157" name="__module.model.gpt_neox.layers.31.attention/aten::index/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4974"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7158" name="__module.model.gpt_neox.layers.31.attention/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4975,cos"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7159" name="__module.model.gpt_neox.layers.31.attention/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4995"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7160" name="Constant_305299" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7161" name="Constant_305298" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7162" name="__module.model.gpt_neox.layers.31.attention/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7163" name="__module.model.gpt_neox.layers.31.attention/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7164" name="__module.model.gpt_neox.layers.31.attention/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4996,5001" /> + </output> + </layer> + <layer id="7165" name="__module.model.gpt_neox.layers.31.attention/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7166" name="__module.model.gpt_neox.layers.31.attention/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4998,4999,5003,5004" /> + </output> + </layer> + <layer id="7167" name="Constant_337896" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7168" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Unsqueeze_17" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7169" name="Constant_305297" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7170" name="ScatterUpdate_305300" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7171" name="Constant_305303" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7172" name="Constant_305306" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7173" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_3" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5005,x2"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7174" name="Constant_325504" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7175" name="__module.model.gpt_neox.layers.31.attention/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5006"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7176" name="Constant_305351" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7177" name="Constant_305356" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7178" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_4" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5000"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7179" name="__module.model.gpt_neox.layers.31.attention/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5008"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7180" name="self.model.gpt_neox.layers.31.attention.rotary_emb.sin_cached" type="Const" version="opset1"> + <data element_type="f32" shape="2048, 128" offset="258220060" size="1048576" /> + <output> + <port id="0" precision="FP32" names="self.model.gpt_neox.layers.31.attention.rotary_emb.sin_cached"> + <dim>2048</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7181" name="__module.model.gpt_neox.layers.31.attention.rotary_emb/aten::slice/Unsqueeze_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7182" name="__module.model.gpt_neox.layers.31.attention.rotary_emb/aten::slice/Unsqueeze_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7183" name="__module.model.gpt_neox.layers.31.attention.rotary_emb/aten::slice/Slice_1" type="StridedSlice" version="opset1"> + <data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>2048</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4969,4972,sin.125"> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7184" name="Constant_38416" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7185" name="__module.model.gpt_neox.layers.31.attention/aten::index/Gather_1" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="4977"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7186" name="__module.model.gpt_neox.layers.31.attention/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4978,sin"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7187" name="__module.model.gpt_neox.layers.31.attention/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5009"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7188" name="__module.model.gpt_neox.layers.31.attention/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5010,5014"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7189" name="__module.model.gpt_neox.layers.31.attention/aten::to/Convert" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.31.key"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7241" name="Constant_305402" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7242" name="Constant_305405" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7243" name="Constant_305408" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7244" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_6" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>384</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4946"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7245" name="Constant_18233" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="4947"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7246" name="__module.model.gpt_neox.layers.31.attention/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4948,query.187"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7247" name="Constant_305414" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7248" name="Constant_305417" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171296" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7249" name="Constant_305420" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7250" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_7" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4955,q"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7251" name="__module.model.gpt_neox.layers.31.attention/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4979"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7252" name="Constant_305424" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7253" name="Constant_305423" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7254" name="__module.model.gpt_neox.layers.31.attention/aten::size/ShapeOf_7" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7255" name="__module.model.gpt_neox.layers.31.attention/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7256" name="__module.model.gpt_neox.layers.31.attention/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4980,4985" /> + </output> + </layer> + <layer id="7257" name="__module.model.gpt_neox.layers.31.attention/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7258" name="__module.model.gpt_neox.layers.31.attention/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4982,4983,4987,4988" /> + </output> + </layer> + <layer id="7259" name="Constant_337898" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7260" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Unsqueeze_37" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7261" name="Constant_305422" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7262" name="ScatterUpdate_305425" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7263" name="Constant_305428" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="258220024" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7264" name="Constant_305431" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7265" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_8" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4989,x2.125"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7266" name="Constant_325505" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="258220056" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7267" name="__module.model.gpt_neox.layers.31.attention/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4990"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7268" name="Constant_305476" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7269" name="Constant_305481" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7270" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_9" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4984"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7271" name="__module.model.gpt_neox.layers.31.attention/aten::cat/Concat_4" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4992"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7272" name="__module.model.gpt_neox.layers.31.attention/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4993"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7273" name="__module.model.gpt_neox.layers.31.attention/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4994,5012,5022,query,query.189"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7274" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_11" type="Const" version="opset1"> + <data element_type="boolean" shape="1, 1, 2048, 2048" offset="259268636" size="4194304" /> + <output> + <port id="0" precision="BOOL" names="5031"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="7275" name="Constant_305524" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7276" name="Constant_305523" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7277" name="ShapeOf_340740" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7278" name="Constant_340741" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7279" name="Constant_340742" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7280" name="Gather_340743" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="7281" name="ShapeOf_340744" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7282" name="Constant_340745" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7283" name="Constant_340746" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7284" name="Gather_340747" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" /> + </output> + </layer> + <layer id="7285" name="Add_340748" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="5026" /> + </output> + </layer> + <layer id="7286" name="ShapeOf_340815" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7287" name="Constant_340816" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="258220008" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7288" name="Constant_340817" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7289" name="Gather_340818" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="5024" /> + </output> + </layer> + <layer id="7290" name="__module.model.gpt_neox.layers.31.attention/aten::sub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="5028,5029" /> + </output> + </layer> + <layer id="7291" name="Constant_337900" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7292" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Unsqueeze_44" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7293" name="Constant_305522" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7294" name="ScatterUpdate_305525" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7295" name="Constant_305526" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462940" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7296" name="Constant_337902" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7297" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Unsqueeze_45" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7298" name="ScatterUpdate_305527" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7299" name="Constant_305530" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263462964" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7300" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_12" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>2048</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + <port id="2" precision="I64"> + <dim>3</dim> + </port> + <port id="3" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="5032"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + </output> + </layer> + <layer id="7301" name="Constant_305603" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7302" name="Constant_305604" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171264" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7303" name="Constant_305600" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220016" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7304" name="Constant_305599" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="0" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7305" name="ScatterUpdate_305605" type="ScatterUpdate" version="opset3"> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7306" name="Constant_305608" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171328" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7307" name="__module.model.gpt_neox.layers.31.attention/aten::slice/Slice_13" type="StridedSlice" version="opset1"> + <data begin_mask="1, 1, 1, 0" end_mask="1, 1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>2048</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + <port id="3" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="4" precision="BOOL" names="5033,5034"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7308" name="__module.model.gpt_neox.layers.31.attention/aten::where/Convert_1" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7309" name="__module.model.gpt_neox.layers.31.attention/aten::full/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="263462988" size="4" /> + <output> + <port id="0" precision="FP32" names="5021" /> + </output> + </layer> + <layer id="7310" name="__module.model.gpt_neox.layers.31.attention/aten::where/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="5035,causal_mask.125"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7311" name="Add_317220" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7312" name="ShapeOf_317221" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7313" name="Constant_340821" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7314" name="Constant_340822" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7315" name="Gather_340823" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="5019"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7316" name="Constant_268271" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7317" name="Constant_268273" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7318" name="Constant_268275" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="258220000" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7319" name="__module.model.gpt_neox.layers.31.attention/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5036"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7320" name="Maximum_317222" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7321" name="__module.model.gpt_neox.layers.31.attention/aten::add/Add_2" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5038"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7322" name="__module.model.gpt_neox.layers.31.attention/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5039,5040,sdpa_result,tensor.125"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7323" name="Constant_18702" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="257171360" size="32" /> + <output> + <port id="0" precision="I64" names="5041"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7324" name="__module.model.gpt_neox.layers.31.attention/aten::permute/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5042"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7325" name="__module.model.gpt_neox.layers.31.attention/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="263463020" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7326" name="__module.model.gpt_neox.layers.31.attention/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>32</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5047"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7327" name="self.model.gpt_neox.layers.31.attention.dense.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 4096" offset="6514618500" size="16777216" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7328" name="Convert_450230" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7329" name="self.model.gpt_neox.layers.31.attention.dense.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="6531395716" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7330" name="Convert_450233" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7331" name="self.model.gpt_neox.layers.31.attention.dense.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7332" name="self.model.gpt_neox.layers.31.attention.dense.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="6531399812" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7333" name="self.model.gpt_neox.layers.31.attention.dense.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7334" name="self.model.gpt_neox.layers.31.attention.dense.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7335" name="__module.model.gpt_neox.layers.31.attention.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7336" name="Constant_325506" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6531408004" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7337" name="__module.model.gpt_neox.layers.31.attention.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5050,5052,input.127"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7338" name="__module.model.gpt_neox.layers.31/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5056,attn_output"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7339" name="__module.model.gpt_neox.layers.31.post_attention_layernorm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7340" name="__module.model.gpt_neox.layers.31.post_attention_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7341" name="Constant_325507" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6531424388" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7342" name="__module.model.gpt_neox.layers.31.post_attention_layernorm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7343" name="Constant_325508" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6531440772" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7344" name="__module.model.gpt_neox.layers.31.post_attention_layernorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5060"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7345" name="self.model.gpt_neox.layers.31.mlp.dense_h_to_4h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 4096" offset="6531457156" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7346" name="Convert_450241" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7347" name="self.model.gpt_neox.layers.31.mlp.dense_h_to_4h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="16384, 1" offset="6598566020" size="16384" /> + <output> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7348" name="Convert_450244" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7349" name="self.model.gpt_neox.layers.31.mlp.dense_h_to_4h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7350" name="self.model.gpt_neox.layers.31.mlp.dense_h_to_4h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="16384, 1" offset="6598582404" size="32768" /> + <output> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7351" name="self.model.gpt_neox.layers.31.mlp.dense_h_to_4h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>16384</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7352" name="self.model.gpt_neox.layers.31.mlp.dense_h_to_4h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7353" name="__module.model.gpt_neox.layers.31.mlp.dense_h_to_4h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>16384</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7354" name="Constant_325509" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 16384" offset="6598615172" size="65536" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7355" name="__module.model.gpt_neox.layers.31.mlp.dense_h_to_4h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5065"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7356" name="__module.model.gpt_neox.layers.31.mlp.act/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="5066"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7357" name="self.model.gpt_neox.layers.31.mlp.dense_4h_to_h.weight" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 16384" offset="6598680708" size="67108864" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7358" name="Convert_450252" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7359" name="self.model.gpt_neox.layers.31.mlp.dense_4h_to_h.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="4096, 1" offset="6665789572" size="4096" /> + <output> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7360" name="Convert_450255" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7361" name="self.model.gpt_neox.layers.31.mlp.dense_4h_to_h.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7362" name="self.model.gpt_neox.layers.31.mlp.dense_4h_to_h.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="4096, 1" offset="6665793668" size="8192" /> + <output> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7363" name="self.model.gpt_neox.layers.31.mlp.dense_4h_to_h.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP16"> + <dim>4096</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7364" name="self.model.gpt_neox.layers.31.mlp.dense_4h_to_h.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </output> + </layer> + <layer id="7365" name="__module.model.gpt_neox.layers.31.mlp.dense_4h_to_h/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>16384</dim> + </port> + <port id="1" precision="FP32"> + <dim>4096</dim> + <dim>16384</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7366" name="Constant_325510" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6665801860" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7367" name="__module.model.gpt_neox.layers.31.mlp.dense_4h_to_h/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5069,input"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7368" name="__module.model.gpt_neox.layers.31/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5071,5073"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7369" name="__module.model.gpt_neox.final_layer_norm/aten::layer_norm/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="206720796" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7370" name="__module.model.gpt_neox.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7371" name="Constant_325511" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6665818244" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7372" name="__module.model.gpt_neox.final_layer_norm/aten::layer_norm/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7373" name="Constant_325512" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 4096" offset="6665834628" size="16384" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7374" name="__module.model.gpt_neox.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5079,5081"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7375" name="self.model.embed_out.weight" type="Const" version="opset1"> + <data element_type="u8" shape="50432, 4096" offset="6665851012" size="206569472" /> + <output> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7376" name="Convert_450263" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7377" name="self.model.embed_out.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="50432, 1" offset="6872420484" size="50432" /> + <output> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7378" name="Convert_450266" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>50432</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7379" name="self.model.embed_out.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7380" name="self.model.embed_out.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="50432, 1" offset="6872470916" size="100864" /> + <output> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7381" name="self.model.embed_out.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP16"> + <dim>50432</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7382" name="self.model.embed_out.weight/fq_weights_1/convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="FP16"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </output> + </layer> + <layer id="7383" name="__module.model.embed_out/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>4096</dim> + </port> + <port id="1" precision="FP32"> + <dim>50432</dim> + <dim>4096</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="logits"> + <dim>-1</dim> + <dim>-1</dim> + <dim>50432</dim> + </port> + </output> + </layer> + <layer id="7240" name="Assign_417283" type="Assign" version="opset6"> + <data variable_id="past_key_values.0.keypresent.0.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7239" name="Assign_417285" type="Assign" version="opset6"> + <data variable_id="past_key_values.0.valuepresent.0.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7238" name="Assign_417287" type="Assign" version="opset6"> + <data variable_id="past_key_values.1.keypresent.1.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7237" name="Assign_417289" type="Assign" version="opset6"> + <data variable_id="past_key_values.1.valuepresent.1.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7236" name="Assign_417291" type="Assign" version="opset6"> + <data variable_id="past_key_values.10.keypresent.10.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7235" name="Assign_417293" type="Assign" version="opset6"> + <data variable_id="past_key_values.10.valuepresent.10.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7234" name="Assign_417295" type="Assign" version="opset6"> + <data variable_id="past_key_values.11.keypresent.11.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7233" name="Assign_417297" type="Assign" version="opset6"> + <data variable_id="past_key_values.11.valuepresent.11.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7232" name="Assign_417299" type="Assign" version="opset6"> + <data variable_id="past_key_values.12.keypresent.12.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7231" name="Assign_417301" type="Assign" version="opset6"> + <data variable_id="past_key_values.12.valuepresent.12.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7230" name="Assign_417303" type="Assign" version="opset6"> + <data variable_id="past_key_values.13.keypresent.13.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7229" name="Assign_417305" type="Assign" version="opset6"> + <data variable_id="past_key_values.13.valuepresent.13.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7228" name="Assign_417307" type="Assign" version="opset6"> + <data variable_id="past_key_values.14.keypresent.14.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7227" name="Assign_417309" type="Assign" version="opset6"> + <data variable_id="past_key_values.14.valuepresent.14.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7226" name="Assign_417311" type="Assign" version="opset6"> + <data variable_id="past_key_values.15.keypresent.15.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7225" name="Assign_417313" type="Assign" version="opset6"> + <data variable_id="past_key_values.15.valuepresent.15.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7224" name="Assign_417315" type="Assign" version="opset6"> + <data variable_id="past_key_values.16.keypresent.16.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7223" name="Assign_417317" type="Assign" version="opset6"> + <data variable_id="past_key_values.16.valuepresent.16.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7222" name="Assign_417319" type="Assign" version="opset6"> + <data variable_id="past_key_values.17.keypresent.17.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7221" name="Assign_417321" type="Assign" version="opset6"> + <data variable_id="past_key_values.17.valuepresent.17.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7220" name="Assign_417323" type="Assign" version="opset6"> + <data variable_id="past_key_values.18.keypresent.18.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7219" name="Assign_417325" type="Assign" version="opset6"> + <data variable_id="past_key_values.18.valuepresent.18.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7218" name="Assign_417327" type="Assign" version="opset6"> + <data variable_id="past_key_values.19.keypresent.19.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7217" name="Assign_417329" type="Assign" version="opset6"> + <data variable_id="past_key_values.19.valuepresent.19.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7216" name="Assign_417331" type="Assign" version="opset6"> + <data variable_id="past_key_values.2.keypresent.2.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7215" name="Assign_417333" type="Assign" version="opset6"> + <data variable_id="past_key_values.2.valuepresent.2.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7214" name="Assign_417335" type="Assign" version="opset6"> + <data variable_id="past_key_values.20.keypresent.20.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7213" name="Assign_417337" type="Assign" version="opset6"> + <data variable_id="past_key_values.20.valuepresent.20.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7212" name="Assign_417339" type="Assign" version="opset6"> + <data variable_id="past_key_values.21.keypresent.21.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7211" name="Assign_417341" type="Assign" version="opset6"> + <data variable_id="past_key_values.21.valuepresent.21.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7210" name="Assign_417343" type="Assign" version="opset6"> + <data variable_id="past_key_values.22.keypresent.22.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7209" name="Assign_417345" type="Assign" version="opset6"> + <data variable_id="past_key_values.22.valuepresent.22.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7208" name="Assign_417347" type="Assign" version="opset6"> + <data variable_id="past_key_values.23.keypresent.23.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7207" name="Assign_417349" type="Assign" version="opset6"> + <data variable_id="past_key_values.23.valuepresent.23.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7206" name="Assign_417351" type="Assign" version="opset6"> + <data variable_id="past_key_values.24.keypresent.24.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7205" name="Assign_417353" type="Assign" version="opset6"> + <data variable_id="past_key_values.24.valuepresent.24.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7204" name="Assign_417355" type="Assign" version="opset6"> + <data variable_id="past_key_values.25.keypresent.25.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7203" name="Assign_417357" type="Assign" version="opset6"> + <data variable_id="past_key_values.25.valuepresent.25.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7202" name="Assign_417359" type="Assign" version="opset6"> + <data variable_id="past_key_values.26.keypresent.26.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7201" name="Assign_417361" type="Assign" version="opset6"> + <data variable_id="past_key_values.26.valuepresent.26.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7200" name="Assign_417363" type="Assign" version="opset6"> + <data variable_id="past_key_values.27.keypresent.27.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7199" name="Assign_417365" type="Assign" version="opset6"> + <data variable_id="past_key_values.27.valuepresent.27.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7198" name="Assign_417367" type="Assign" version="opset6"> + <data variable_id="past_key_values.28.keypresent.28.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7197" name="Assign_417369" type="Assign" version="opset6"> + <data variable_id="past_key_values.28.valuepresent.28.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7196" name="Assign_417371" type="Assign" version="opset6"> + <data variable_id="past_key_values.29.keypresent.29.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7195" name="Assign_417373" type="Assign" version="opset6"> + <data variable_id="past_key_values.29.valuepresent.29.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7194" name="Assign_417375" type="Assign" version="opset6"> + <data variable_id="past_key_values.3.keypresent.3.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7193" name="Assign_417377" type="Assign" version="opset6"> + <data variable_id="past_key_values.3.valuepresent.3.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7192" name="Assign_417379" type="Assign" version="opset6"> + <data variable_id="past_key_values.30.keypresent.30.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7191" name="Assign_417381" type="Assign" version="opset6"> + <data variable_id="past_key_values.30.valuepresent.30.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7190" name="Assign_417383" type="Assign" version="opset6"> + <data variable_id="past_key_values.31.keypresent.31.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7123" name="Assign_417385" type="Assign" version="opset6"> + <data variable_id="past_key_values.31.valuepresent.31.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2196" name="Assign_417387" type="Assign" version="opset6"> + <data variable_id="past_key_values.4.keypresent.4.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2195" name="Assign_417389" type="Assign" version="opset6"> + <data variable_id="past_key_values.4.valuepresent.4.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2194" name="Assign_417391" type="Assign" version="opset6"> + <data variable_id="past_key_values.5.keypresent.5.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2193" name="Assign_417393" type="Assign" version="opset6"> + <data variable_id="past_key_values.5.valuepresent.5.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2192" name="Assign_417395" type="Assign" version="opset6"> + <data variable_id="past_key_values.6.keypresent.6.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2191" name="Assign_417397" type="Assign" version="opset6"> + <data variable_id="past_key_values.6.valuepresent.6.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2190" name="Assign_417399" type="Assign" version="opset6"> + <data variable_id="past_key_values.7.keypresent.7.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2189" name="Assign_417401" type="Assign" version="opset6"> + <data variable_id="past_key_values.7.valuepresent.7.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2188" name="Assign_417403" type="Assign" version="opset6"> + <data variable_id="past_key_values.8.keypresent.8.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2187" name="Assign_417405" type="Assign" version="opset6"> + <data variable_id="past_key_values.8.valuepresent.8.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2186" name="Assign_417407" type="Assign" version="opset6"> + <data variable_id="past_key_values.9.keypresent.9.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2117" name="Assign_417409" type="Assign" version="opset6"> + <data variable_id="past_key_values.9.valuepresent.9.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>32</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7384" name="Result_140468" type="Result" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>50432</dim> + </port> + </input> + </layer> + </layers> + <edges> + <edge from-layer="0" from-port="0" to-layer="1084" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1003" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6009" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4647" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6090" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6236" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="549" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6317" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4501" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6463" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5863" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6544" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6690" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4420" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6771" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6917" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1230" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4274" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6998" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5409" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="630" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5101" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4955" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="776" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5182" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3820" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5328" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4874" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="160" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3739" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4728" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5555" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="403" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="75" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5636" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1992" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="857" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5782" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3058" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3366" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3285" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3966" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3139" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2458" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1538" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1911" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2604" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="322" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="16" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2912" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2205" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1684" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1765" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2685" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2831" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3512" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1457" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4047" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3593" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2377" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2126" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1311" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4193" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7132" to-port="1" /> + <edge from-layer="1" from-port="0" to-layer="85" to-port="0" /> + <edge from-layer="2" from-port="0" to-layer="208" to-port="0" /> + <edge from-layer="3" from-port="0" to-layer="25" to-port="0" /> + <edge from-layer="3" from-port="0" to-layer="5" to-port="0" /> + <edge from-layer="3" from-port="0" to-layer="202" to-port="0" /> + <edge from-layer="4" from-port="0" to-layer="13" to-port="0" /> + <edge from-layer="5" from-port="1" to-layer="8" to-port="0" /> + <edge from-layer="6" from-port="0" to-layer="8" to-port="1" /> + <edge from-layer="7" from-port="0" to-layer="8" to-port="2" /> + <edge from-layer="8" from-port="3" to-layer="1907" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4416" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4724" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1761" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4870" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4189" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4497" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1988" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4951" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3962" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2201" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4270" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4643" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4043" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3362" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6913" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2122" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6994" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3735" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7128" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="318" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2373" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3589" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3508" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6767" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3281" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2454" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3135" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2600" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3054" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2908" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2681" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2827" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5778" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5178" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="156" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5324" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3816" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5405" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5551" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5632" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="399" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5097" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5859" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6005" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6086" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6232" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6313" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6459" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6540" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6686" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="626" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="71" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="545" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1307" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1226" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1453" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1080" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="999" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="853" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1534" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="12" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="772" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1680" to-port="0" /> + <edge from-layer="9" from-port="0" to-layer="12" to-port="1" /> + <edge from-layer="10" from-port="0" to-layer="12" to-port="2" /> + <edge from-layer="11" from-port="0" to-layer="12" to-port="3" /> + <edge from-layer="12" from-port="4" to-layer="13" to-port="1" /> + <edge from-layer="13" from-port="2" to-layer="14" to-port="0" /> + <edge from-layer="14" from-port="1" to-layer="16" to-port="0" /> + <edge from-layer="15" from-port="0" to-layer="16" to-port="2" /> + <edge from-layer="16" from-port="3" to-layer="2116" to-port="0" /> + <edge from-layer="17" from-port="0" to-layer="18" to-port="0" /> + <edge from-layer="18" from-port="1" to-layer="21" to-port="0" /> + <edge from-layer="19" from-port="0" to-layer="20" to-port="0" /> + <edge from-layer="20" from-port="1" to-layer="21" to-port="1" /> + <edge from-layer="21" from-port="2" to-layer="23" to-port="0" /> + <edge from-layer="22" from-port="0" to-layer="23" to-port="1" /> + <edge from-layer="23" from-port="2" to-layer="24" to-port="0" /> + <edge from-layer="24" from-port="1" to-layer="27" to-port="0" /> + <edge from-layer="25" from-port="1" to-layer="27" to-port="1" /> + <edge from-layer="26" from-port="0" to-layer="27" to-port="2" /> + <edge from-layer="27" from-port="3" to-layer="29" to-port="0" /> + <edge from-layer="27" from-port="3" to-layer="244" to-port="1" /> + <edge from-layer="28" from-port="0" to-layer="29" to-port="1" /> + <edge from-layer="29" from-port="2" to-layer="31" to-port="0" /> + <edge from-layer="30" from-port="0" to-layer="31" to-port="1" /> + <edge from-layer="31" from-port="2" to-layer="33" to-port="0" /> + <edge from-layer="32" from-port="0" to-layer="33" to-port="1" /> + <edge from-layer="33" from-port="2" to-layer="42" to-port="0" /> + <edge from-layer="34" from-port="0" to-layer="35" to-port="0" /> + <edge from-layer="35" from-port="1" to-layer="38" to-port="0" /> + <edge from-layer="36" from-port="0" to-layer="37" to-port="0" /> + <edge from-layer="37" from-port="1" to-layer="38" to-port="1" /> + <edge from-layer="38" from-port="2" to-layer="40" to-port="0" /> + <edge from-layer="39" from-port="0" to-layer="40" to-port="1" /> + <edge from-layer="40" from-port="2" to-layer="41" to-port="0" /> + <edge from-layer="41" from-port="1" to-layer="42" to-port="1" /> + <edge from-layer="42" from-port="2" to-layer="44" to-port="0" /> + <edge from-layer="43" from-port="0" to-layer="44" to-port="1" /> + <edge from-layer="44" from-port="2" to-layer="46" to-port="0" /> + <edge from-layer="45" from-port="0" to-layer="46" to-port="1" /> + <edge from-layer="46" from-port="2" to-layer="62" to-port="0" /> + <edge from-layer="46" from-port="2" to-layer="50" to-port="0" /> + <edge from-layer="46" from-port="2" to-layer="164" to-port="0" /> + <edge from-layer="47" from-port="0" to-layer="50" to-port="1" /> + <edge from-layer="48" from-port="0" to-layer="50" to-port="2" /> + <edge from-layer="49" from-port="0" to-layer="50" to-port="3" /> + <edge from-layer="50" from-port="4" to-layer="52" to-port="0" /> + <edge from-layer="51" from-port="0" to-layer="52" to-port="1" /> + <edge from-layer="52" from-port="2" to-layer="56" to-port="0" /> + <edge from-layer="53" from-port="0" to-layer="56" to-port="1" /> + <edge from-layer="54" from-port="0" to-layer="56" to-port="2" /> + <edge from-layer="55" from-port="0" to-layer="56" to-port="3" /> + <edge from-layer="56" from-port="4" to-layer="93" to-port="0" /> + <edge from-layer="56" from-port="4" to-layer="111" to-port="0" /> + <edge from-layer="56" from-port="4" to-layer="106" to-port="0" /> + <edge from-layer="56" from-port="4" to-layer="90" to-port="0" /> + <edge from-layer="57" from-port="0" to-layer="84" to-port="0" /> + <edge from-layer="58" from-port="0" to-layer="84" to-port="1" /> + <edge from-layer="59" from-port="0" to-layer="62" to-port="1" /> + <edge from-layer="60" from-port="0" to-layer="62" to-port="2" /> + <edge from-layer="61" from-port="0" to-layer="62" to-port="3" /> + <edge from-layer="62" from-port="4" to-layer="123" to-port="0" /> + <edge from-layer="62" from-port="4" to-layer="63" to-port="0" /> + <edge from-layer="63" from-port="1" to-layer="66" to-port="0" /> + <edge from-layer="64" from-port="0" to-layer="66" to-port="1" /> + <edge from-layer="65" from-port="0" to-layer="66" to-port="2" /> + <edge from-layer="66" from-port="3" to-layer="82" to-port="0" /> + <edge from-layer="67" from-port="0" to-layer="72" to-port="0" /> + <edge from-layer="68" from-port="0" to-layer="71" to-port="1" /> + <edge from-layer="69" from-port="0" to-layer="71" to-port="2" /> + <edge from-layer="70" from-port="0" to-layer="71" to-port="3" /> + <edge from-layer="71" from-port="4" to-layer="72" to-port="1" /> + <edge from-layer="72" from-port="2" to-layer="73" to-port="0" /> + <edge from-layer="73" from-port="1" to-layer="75" to-port="0" /> + <edge from-layer="74" from-port="0" to-layer="75" to-port="2" /> + <edge from-layer="75" from-port="3" to-layer="151" to-port="0" /> + <edge from-layer="75" from-port="3" to-layer="76" to-port="0" /> + <edge from-layer="76" from-port="1" to-layer="79" to-port="0" /> + <edge from-layer="77" from-port="0" to-layer="79" to-port="1" /> + <edge from-layer="78" from-port="0" to-layer="79" to-port="2" /> + <edge from-layer="79" from-port="3" to-layer="175" to-port="0" /> + <edge from-layer="79" from-port="3" to-layer="81" to-port="0" /> + <edge from-layer="80" from-port="0" to-layer="81" to-port="1" /> + <edge from-layer="81" from-port="2" to-layer="82" to-port="1" /> + <edge from-layer="82" from-port="2" to-layer="116" to-port="2" /> + <edge from-layer="82" from-port="2" to-layer="84" to-port="2" /> + <edge from-layer="83" from-port="0" to-layer="84" to-port="3" /> + <edge from-layer="84" from-port="4" to-layer="87" to-port="0" /> + <edge from-layer="85" from-port="1" to-layer="3296" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1723" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2842" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2870" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2181" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3069" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3097" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3551" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3324" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="7157" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="588" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="7185" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3523" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2153" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1241" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4885" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="787" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="560" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="815" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4686" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4658" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1014" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1042" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4459" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4431" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4913" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1269" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4232" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4204" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1468" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="4005" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1950" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3977" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1496" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1922" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="1695" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3778" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6928" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="333" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6729" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="3750" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6701" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6502" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6474" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="361" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6275" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6247" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6956" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6048" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="6020" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5821" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5793" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5594" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5566" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5367" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5339" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5140" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="5112" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2615" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2416" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2388" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="2643" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="87" to-port="1" /> + <edge from-layer="85" from-port="1" to-layer="118" to-port="1" /> + <edge from-layer="86" from-port="0" to-layer="87" to-port="2" /> + <edge from-layer="87" from-port="3" to-layer="89" to-port="0" /> + <edge from-layer="88" from-port="0" to-layer="6276" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6248" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="362" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1270" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1469" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6475" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6021" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6503" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1497" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1242" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3751" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6702" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6730" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1043" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="334" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6929" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1015" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6957" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="816" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="7158" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="561" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="788" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="7186" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5141" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1951" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4006" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3978" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4205" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4233" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4432" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4460" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4659" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4687" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4886" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="4914" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5113" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3779" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1923" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5340" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5368" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="119" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5567" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5595" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1724" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5794" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="5822" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="1696" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2843" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="6049" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2644" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3098" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="589" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3297" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2389" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2417" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3070" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3552" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2871" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3325" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2182" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="3524" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="89" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2154" to-port="1" /> + <edge from-layer="88" from-port="0" to-layer="2616" to-port="1" /> + <edge from-layer="89" from-port="2" to-layer="90" to-port="1" /> + <edge from-layer="89" from-port="2" to-layer="128" to-port="1" /> + <edge from-layer="90" from-port="2" to-layer="121" to-port="0" /> + <edge from-layer="91" from-port="0" to-layer="103" to-port="0" /> + <edge from-layer="92" from-port="0" to-layer="103" to-port="1" /> + <edge from-layer="93" from-port="1" to-layer="96" to-port="0" /> + <edge from-layer="94" from-port="0" to-layer="5346" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6254" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3339" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6290" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="5382" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3076" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="133" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="376" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1284" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6481" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4247" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6517" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1248" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3112" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1702" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="603" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="5800" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4020" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1738" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3793" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="5836" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2849" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="5609" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4211" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6027" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="5573" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6063" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3303" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1511" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2885" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1965" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1475" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2431" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4892" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4474" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1057" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1929" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="1021" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3530" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6935" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2658" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4665" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4928" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6971" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2160" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="830" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="96" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="794" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="7164" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3566" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4701" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="567" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3984" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="7256" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="5119" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2622" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2221" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6708" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="5155" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="4438" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="2395" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="6744" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="340" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="3757" to-port="1" /> + <edge from-layer="95" from-port="0" to-layer="96" to-port="2" /> + <edge from-layer="96" from-port="3" to-layer="98" to-port="0" /> + <edge from-layer="97" from-port="0" to-layer="3113" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5156" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="134" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5574" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4248" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1930" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4021" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1739" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5610" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4702" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4439" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2850" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5383" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4893" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5120" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4666" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4929" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3077" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5347" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2659" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2623" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1966" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4475" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2886" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="4212" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1058" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1285" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2161" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6482" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1249" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="568" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3758" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6518" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2396" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6709" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="341" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6745" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5801" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1022" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3531" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6936" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="98" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2222" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6972" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="831" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="795" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="7165" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3567" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="7257" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3340" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3985" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="5837" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="2432" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6028" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1512" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="377" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6064" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="604" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3304" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="3794" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1476" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6255" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="1703" to-port="1" /> + <edge from-layer="97" from-port="0" to-layer="6291" to-port="1" /> + <edge from-layer="98" from-port="2" to-layer="99" to-port="0" /> + <edge from-layer="99" from-port="1" to-layer="101" to-port="0" /> + <edge from-layer="100" from-port="0" to-layer="101" to-port="1" /> + <edge from-layer="101" from-port="2" to-layer="103" to-port="2" /> + <edge from-layer="102" from-port="0" to-layer="103" to-port="3" /> + <edge from-layer="103" from-port="4" to-layer="106" to-port="1" /> + <edge from-layer="103" from-port="4" to-layer="111" to-port="2" /> + <edge from-layer="104" from-port="0" to-layer="106" to-port="2" /> + <edge from-layer="105" from-port="0" to-layer="106" to-port="3" /> + <edge from-layer="106" from-port="4" to-layer="108" to-port="0" /> + <edge from-layer="107" from-port="0" to-layer="108" to-port="1" /> + <edge from-layer="108" from-port="2" to-layer="112" to-port="0" /> + <edge from-layer="109" from-port="0" to-layer="111" to-port="1" /> + <edge from-layer="110" from-port="0" to-layer="111" to-port="3" /> + <edge from-layer="111" from-port="4" to-layer="112" to-port="1" /> + <edge from-layer="112" from-port="2" to-layer="120" to-port="0" /> + <edge from-layer="113" from-port="0" to-layer="116" to-port="0" /> + <edge from-layer="114" from-port="0" to-layer="116" to-port="1" /> + <edge from-layer="115" from-port="0" to-layer="116" to-port="3" /> + <edge from-layer="116" from-port="4" to-layer="118" to-port="0" /> + <edge from-layer="117" from-port="0" to-layer="118" to-port="2" /> + <edge from-layer="118" from-port="3" to-layer="119" to-port="0" /> + <edge from-layer="119" from-port="2" to-layer="149" to-port="1" /> + <edge from-layer="119" from-port="2" to-layer="120" to-port="1" /> + <edge from-layer="120" from-port="2" to-layer="121" to-port="1" /> + <edge from-layer="121" from-port="2" to-layer="228" to-port="0" /> + <edge from-layer="121" from-port="2" to-layer="176" to-port="0" /> + <edge from-layer="122" from-port="0" to-layer="123" to-port="1" /> + <edge from-layer="123" from-port="2" to-layer="127" to-port="0" /> + <edge from-layer="124" from-port="0" to-layer="127" to-port="1" /> + <edge from-layer="125" from-port="0" to-layer="127" to-port="2" /> + <edge from-layer="126" from-port="0" to-layer="127" to-port="3" /> + <edge from-layer="127" from-port="4" to-layer="142" to-port="0" /> + <edge from-layer="127" from-port="4" to-layer="131" to-port="0" /> + <edge from-layer="127" from-port="4" to-layer="147" to-port="0" /> + <edge from-layer="127" from-port="4" to-layer="128" to-port="0" /> + <edge from-layer="128" from-port="2" to-layer="150" to-port="0" /> + <edge from-layer="129" from-port="0" to-layer="139" to-port="0" /> + <edge from-layer="130" from-port="0" to-layer="139" to-port="1" /> + <edge from-layer="131" from-port="1" to-layer="133" to-port="0" /> + <edge from-layer="132" from-port="0" to-layer="133" to-port="2" /> + <edge from-layer="133" from-port="3" to-layer="134" to-port="0" /> + <edge from-layer="134" from-port="2" to-layer="135" to-port="0" /> + <edge from-layer="135" from-port="1" to-layer="137" to-port="0" /> + <edge from-layer="136" from-port="0" to-layer="137" to-port="1" /> + <edge from-layer="137" from-port="2" to-layer="139" to-port="2" /> + <edge from-layer="138" from-port="0" to-layer="139" to-port="3" /> + <edge from-layer="139" from-port="4" to-layer="142" to-port="1" /> + <edge from-layer="139" from-port="4" to-layer="147" to-port="2" /> + <edge from-layer="140" from-port="0" to-layer="142" to-port="2" /> + <edge from-layer="141" from-port="0" to-layer="142" to-port="3" /> + <edge from-layer="142" from-port="4" to-layer="144" to-port="0" /> + <edge from-layer="143" from-port="0" to-layer="144" to-port="1" /> + <edge from-layer="144" from-port="2" to-layer="148" to-port="0" /> + <edge from-layer="145" from-port="0" to-layer="147" to-port="1" /> + <edge from-layer="146" from-port="0" to-layer="147" to-port="3" /> + <edge from-layer="147" from-port="4" to-layer="148" to-port="1" /> + <edge from-layer="148" from-port="2" to-layer="149" to-port="0" /> + <edge from-layer="149" from-port="2" to-layer="150" to-port="1" /> + <edge from-layer="150" from-port="2" to-layer="151" to-port="1" /> + <edge from-layer="150" from-port="2" to-layer="171" to-port="0" /> + <edge from-layer="151" from-port="2" to-layer="228" to-port="1" /> + <edge from-layer="151" from-port="2" to-layer="7240" to-port="0" /> + <edge from-layer="152" from-port="0" to-layer="157" to-port="0" /> + <edge from-layer="153" from-port="0" to-layer="156" to-port="1" /> + <edge from-layer="154" from-port="0" to-layer="156" to-port="2" /> + <edge from-layer="155" from-port="0" to-layer="156" to-port="3" /> + <edge from-layer="156" from-port="4" to-layer="157" to-port="1" /> + <edge from-layer="157" from-port="2" to-layer="158" to-port="0" /> + <edge from-layer="158" from-port="1" to-layer="160" to-port="0" /> + <edge from-layer="159" from-port="0" to-layer="160" to-port="2" /> + <edge from-layer="160" from-port="3" to-layer="167" to-port="0" /> + <edge from-layer="161" from-port="0" to-layer="164" to-port="1" /> + <edge from-layer="162" from-port="0" to-layer="164" to-port="2" /> + <edge from-layer="163" from-port="0" to-layer="164" to-port="3" /> + <edge from-layer="164" from-port="4" to-layer="166" to-port="0" /> + <edge from-layer="165" from-port="0" to-layer="166" to-port="1" /> + <edge from-layer="166" from-port="2" to-layer="167" to-port="1" /> + <edge from-layer="167" from-port="2" to-layer="7239" to-port="0" /> + <edge from-layer="167" from-port="2" to-layer="228" to-port="2" /> + <edge from-layer="168" from-port="0" to-layer="190" to-port="0" /> + <edge from-layer="169" from-port="0" to-layer="184" to-port="0" /> + <edge from-layer="170" from-port="0" to-layer="184" to-port="1" /> + <edge from-layer="170" from-port="0" to-layer="188" to-port="1" /> + <edge from-layer="171" from-port="1" to-layer="174" to-port="0" /> + <edge from-layer="172" from-port="0" to-layer="174" to-port="1" /> + <edge from-layer="173" from-port="0" to-layer="174" to-port="2" /> + <edge from-layer="174" from-port="3" to-layer="175" to-port="1" /> + <edge from-layer="175" from-port="2" to-layer="180" to-port="0" /> + <edge from-layer="175" from-port="2" to-layer="187" to-port="0" /> + <edge from-layer="176" from-port="1" to-layer="221" to-port="0" /> + <edge from-layer="176" from-port="1" to-layer="179" to-port="0" /> + <edge from-layer="177" from-port="0" to-layer="179" to-port="1" /> + <edge from-layer="178" from-port="0" to-layer="179" to-port="2" /> + <edge from-layer="179" from-port="3" to-layer="180" to-port="1" /> + <edge from-layer="180" from-port="2" to-layer="182" to-port="0" /> + <edge from-layer="181" from-port="0" to-layer="182" to-port="1" /> + <edge from-layer="182" from-port="2" to-layer="184" to-port="2" /> + <edge from-layer="183" from-port="0" to-layer="184" to-port="3" /> + <edge from-layer="183" from-port="0" to-layer="188" to-port="3" /> + <edge from-layer="184" from-port="4" to-layer="190" to-port="1" /> + <edge from-layer="185" from-port="0" to-layer="188" to-port="0" /> + <edge from-layer="186" from-port="0" to-layer="187" to-port="1" /> + <edge from-layer="187" from-port="2" to-layer="188" to-port="2" /> + <edge from-layer="187" from-port="2" to-layer="195" to-port="2" /> + <edge from-layer="188" from-port="4" to-layer="190" to-port="2" /> + <edge from-layer="189" from-port="0" to-layer="190" to-port="3" /> + <edge from-layer="190" from-port="4" to-layer="197" to-port="0" /> + <edge from-layer="191" from-port="0" to-layer="197" to-port="1" /> + <edge from-layer="192" from-port="0" to-layer="195" to-port="0" /> + <edge from-layer="193" from-port="0" to-layer="195" to-port="1" /> + <edge from-layer="194" from-port="0" to-layer="195" to-port="3" /> + <edge from-layer="195" from-port="4" to-layer="197" to-port="2" /> + <edge from-layer="196" from-port="0" to-layer="197" to-port="3" /> + <edge from-layer="197" from-port="4" to-layer="200" to-port="0" /> + <edge from-layer="198" from-port="0" to-layer="200" to-port="1" /> + <edge from-layer="199" from-port="0" to-layer="200" to-port="2" /> + <edge from-layer="200" from-port="3" to-layer="217" to-port="0" /> + <edge from-layer="201" from-port="0" to-layer="214" to-port="0" /> + <edge from-layer="202" from-port="1" to-layer="205" to-port="0" /> + <edge from-layer="203" from-port="0" to-layer="205" to-port="1" /> + <edge from-layer="204" from-port="0" to-layer="205" to-port="2" /> + <edge from-layer="205" from-port="3" to-layer="207" to-port="0" /> + <edge from-layer="206" from-port="0" to-layer="207" to-port="1" /> + <edge from-layer="207" from-port="2" to-layer="208" to-port="1" /> + <edge from-layer="208" from-port="2" to-layer="210" to-port="0" /> + <edge from-layer="209" from-port="0" to-layer="210" to-port="1" /> + <edge from-layer="210" from-port="2" to-layer="211" to-port="0" /> + <edge from-layer="211" from-port="1" to-layer="213" to-port="0" /> + <edge from-layer="212" from-port="0" to-layer="213" to-port="1" /> + <edge from-layer="213" from-port="2" to-layer="214" to-port="1" /> + <edge from-layer="214" from-port="2" to-layer="216" to-port="0" /> + <edge from-layer="215" from-port="0" to-layer="216" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="7039" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="7311" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="3634" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="671" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="3407" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="3180" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="2499" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="2953" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="4088" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="2272" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="2033" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="4315" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="3861" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="4542" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="4769" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="4996" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="5223" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="5450" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="2726" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="1806" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="898" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="5677" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="5904" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="1579" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="6131" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="1352" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="6358" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="6585" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="1125" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="6812" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="217" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="444" to-port="1" /> + <edge from-layer="217" from-port="2" to-layer="218" to-port="0" /> + <edge from-layer="217" from-port="2" to-layer="227" to-port="0" /> + <edge from-layer="218" from-port="1" to-layer="226" to-port="0" /> + <edge from-layer="219" from-port="0" to-layer="221" to-port="1" /> + <edge from-layer="220" from-port="0" to-layer="221" to-port="2" /> + <edge from-layer="221" from-port="3" to-layer="225" to-port="0" /> + <edge from-layer="222" from-port="0" to-layer="225" to-port="1" /> + <edge from-layer="223" from-port="0" to-layer="225" to-port="2" /> + <edge from-layer="224" from-port="0" to-layer="225" to-port="3" /> + <edge from-layer="225" from-port="4" to-layer="226" to-port="1" /> + <edge from-layer="226" from-port="2" to-layer="227" to-port="1" /> + <edge from-layer="227" from-port="2" to-layer="228" to-port="3" /> + <edge from-layer="228" from-port="4" to-layer="230" to-port="0" /> + <edge from-layer="229" from-port="0" to-layer="230" to-port="1" /> + <edge from-layer="230" from-port="2" to-layer="232" to-port="0" /> + <edge from-layer="231" from-port="0" to-layer="232" to-port="1" /> + <edge from-layer="232" from-port="2" to-layer="241" to-port="0" /> + <edge from-layer="233" from-port="0" to-layer="234" to-port="0" /> + <edge from-layer="234" from-port="1" to-layer="237" to-port="0" /> + <edge from-layer="235" from-port="0" to-layer="236" to-port="0" /> + <edge from-layer="236" from-port="1" to-layer="237" to-port="1" /> + <edge from-layer="237" from-port="2" to-layer="239" to-port="0" /> + <edge from-layer="238" from-port="0" to-layer="239" to-port="1" /> + <edge from-layer="239" from-port="2" to-layer="240" to-port="0" /> + <edge from-layer="240" from-port="1" to-layer="241" to-port="1" /> + <edge from-layer="241" from-port="2" to-layer="243" to-port="0" /> + <edge from-layer="242" from-port="0" to-layer="243" to-port="1" /> + <edge from-layer="243" from-port="2" to-layer="244" to-port="0" /> + <edge from-layer="244" from-port="2" to-layer="274" to-port="1" /> + <edge from-layer="244" from-port="2" to-layer="246" to-port="0" /> + <edge from-layer="245" from-port="0" to-layer="246" to-port="1" /> + <edge from-layer="246" from-port="2" to-layer="248" to-port="0" /> + <edge from-layer="247" from-port="0" to-layer="248" to-port="1" /> + <edge from-layer="248" from-port="2" to-layer="250" to-port="0" /> + <edge from-layer="249" from-port="0" to-layer="250" to-port="1" /> + <edge from-layer="250" from-port="2" to-layer="259" to-port="0" /> + <edge from-layer="251" from-port="0" to-layer="252" to-port="0" /> + <edge from-layer="252" from-port="1" to-layer="255" to-port="0" /> + <edge from-layer="253" from-port="0" to-layer="254" to-port="0" /> + <edge from-layer="254" from-port="1" to-layer="255" to-port="1" /> + <edge from-layer="255" from-port="2" to-layer="257" to-port="0" /> + <edge from-layer="256" from-port="0" to-layer="257" to-port="1" /> + <edge from-layer="257" from-port="2" to-layer="258" to-port="0" /> + <edge from-layer="258" from-port="1" to-layer="259" to-port="1" /> + <edge from-layer="259" from-port="2" to-layer="261" to-port="0" /> + <edge from-layer="260" from-port="0" to-layer="261" to-port="1" /> + <edge from-layer="261" from-port="2" to-layer="262" to-port="0" /> + <edge from-layer="262" from-port="1" to-layer="271" to-port="0" /> + <edge from-layer="263" from-port="0" to-layer="264" to-port="0" /> + <edge from-layer="264" from-port="1" to-layer="267" to-port="0" /> + <edge from-layer="265" from-port="0" to-layer="266" to-port="0" /> + <edge from-layer="266" from-port="1" to-layer="267" to-port="1" /> + <edge from-layer="267" from-port="2" to-layer="269" to-port="0" /> + <edge from-layer="268" from-port="0" to-layer="269" to-port="1" /> + <edge from-layer="269" from-port="2" to-layer="270" to-port="0" /> + <edge from-layer="270" from-port="1" to-layer="271" to-port="1" /> + <edge from-layer="271" from-port="2" to-layer="273" to-port="0" /> + <edge from-layer="272" from-port="0" to-layer="273" to-port="1" /> + <edge from-layer="273" from-port="2" to-layer="274" to-port="0" /> + <edge from-layer="274" from-port="2" to-layer="471" to-port="1" /> + <edge from-layer="274" from-port="2" to-layer="276" to-port="0" /> + <edge from-layer="275" from-port="0" to-layer="276" to-port="1" /> + <edge from-layer="276" from-port="2" to-layer="278" to-port="0" /> + <edge from-layer="277" from-port="0" to-layer="278" to-port="1" /> + <edge from-layer="278" from-port="2" to-layer="280" to-port="0" /> + <edge from-layer="279" from-port="0" to-layer="280" to-port="1" /> + <edge from-layer="280" from-port="2" to-layer="289" to-port="0" /> + <edge from-layer="281" from-port="0" to-layer="282" to-port="0" /> + <edge from-layer="282" from-port="1" to-layer="285" to-port="0" /> + <edge from-layer="283" from-port="0" to-layer="284" to-port="0" /> + <edge from-layer="284" from-port="1" to-layer="285" to-port="1" /> + <edge from-layer="285" from-port="2" to-layer="287" to-port="0" /> + <edge from-layer="286" from-port="0" to-layer="287" to-port="1" /> + <edge from-layer="287" from-port="2" to-layer="288" to-port="0" /> + <edge from-layer="288" from-port="1" to-layer="289" to-port="1" /> + <edge from-layer="289" from-port="2" to-layer="291" to-port="0" /> + <edge from-layer="290" from-port="0" to-layer="291" to-port="1" /> + <edge from-layer="291" from-port="2" to-layer="293" to-port="0" /> + <edge from-layer="292" from-port="0" to-layer="293" to-port="1" /> + <edge from-layer="293" from-port="2" to-layer="309" to-port="0" /> + <edge from-layer="293" from-port="2" to-layer="407" to-port="0" /> + <edge from-layer="293" from-port="2" to-layer="297" to-port="0" /> + <edge from-layer="294" from-port="0" to-layer="297" to-port="1" /> + <edge from-layer="295" from-port="0" to-layer="297" to-port="2" /> + <edge from-layer="296" from-port="0" to-layer="297" to-port="3" /> + <edge from-layer="297" from-port="4" to-layer="299" to-port="0" /> + <edge from-layer="298" from-port="0" to-layer="299" to-port="1" /> + <edge from-layer="299" from-port="2" to-layer="303" to-port="0" /> + <edge from-layer="300" from-port="0" to-layer="303" to-port="1" /> + <edge from-layer="301" from-port="0" to-layer="303" to-port="2" /> + <edge from-layer="302" from-port="0" to-layer="303" to-port="3" /> + <edge from-layer="303" from-port="4" to-layer="349" to-port="0" /> + <edge from-layer="303" from-port="4" to-layer="354" to-port="0" /> + <edge from-layer="303" from-port="4" to-layer="335" to-port="0" /> + <edge from-layer="303" from-port="4" to-layer="338" to-port="0" /> + <edge from-layer="304" from-port="0" to-layer="331" to-port="0" /> + <edge from-layer="305" from-port="0" to-layer="331" to-port="1" /> + <edge from-layer="306" from-port="0" to-layer="309" to-port="1" /> + <edge from-layer="307" from-port="0" to-layer="309" to-port="2" /> + <edge from-layer="308" from-port="0" to-layer="309" to-port="3" /> + <edge from-layer="309" from-port="4" to-layer="366" to-port="0" /> + <edge from-layer="309" from-port="4" to-layer="310" to-port="0" /> + <edge from-layer="310" from-port="1" to-layer="313" to-port="0" /> + <edge from-layer="311" from-port="0" to-layer="313" to-port="1" /> + <edge from-layer="312" from-port="0" to-layer="313" to-port="2" /> + <edge from-layer="313" from-port="3" to-layer="329" to-port="0" /> + <edge from-layer="314" from-port="0" to-layer="319" to-port="0" /> + <edge from-layer="315" from-port="0" to-layer="318" to-port="1" /> + <edge from-layer="316" from-port="0" to-layer="318" to-port="2" /> + <edge from-layer="317" from-port="0" to-layer="318" to-port="3" /> + <edge from-layer="318" from-port="4" to-layer="319" to-port="1" /> + <edge from-layer="319" from-port="2" to-layer="320" to-port="0" /> + <edge from-layer="320" from-port="1" to-layer="322" to-port="0" /> + <edge from-layer="321" from-port="0" to-layer="322" to-port="2" /> + <edge from-layer="322" from-port="3" to-layer="394" to-port="0" /> + <edge from-layer="322" from-port="3" to-layer="323" to-port="0" /> + <edge from-layer="323" from-port="1" to-layer="326" to-port="0" /> + <edge from-layer="324" from-port="0" to-layer="326" to-port="1" /> + <edge from-layer="325" from-port="0" to-layer="326" to-port="2" /> + <edge from-layer="326" from-port="3" to-layer="328" to-port="0" /> + <edge from-layer="326" from-port="3" to-layer="418" to-port="0" /> + <edge from-layer="327" from-port="0" to-layer="328" to-port="1" /> + <edge from-layer="328" from-port="2" to-layer="329" to-port="1" /> + <edge from-layer="329" from-port="2" to-layer="331" to-port="2" /> + <edge from-layer="329" from-port="2" to-layer="359" to-port="2" /> + <edge from-layer="330" from-port="0" to-layer="331" to-port="3" /> + <edge from-layer="331" from-port="4" to-layer="333" to-port="0" /> + <edge from-layer="332" from-port="0" to-layer="333" to-port="2" /> + <edge from-layer="333" from-port="3" to-layer="334" to-port="0" /> + <edge from-layer="334" from-port="2" to-layer="335" to-port="1" /> + <edge from-layer="334" from-port="2" to-layer="371" to-port="1" /> + <edge from-layer="335" from-port="2" to-layer="364" to-port="0" /> + <edge from-layer="336" from-port="0" to-layer="346" to-port="0" /> + <edge from-layer="337" from-port="0" to-layer="346" to-port="1" /> + <edge from-layer="338" from-port="1" to-layer="340" to-port="0" /> + <edge from-layer="339" from-port="0" to-layer="340" to-port="2" /> + <edge from-layer="340" from-port="3" to-layer="341" to-port="0" /> + <edge from-layer="341" from-port="2" to-layer="342" to-port="0" /> + <edge from-layer="342" from-port="1" to-layer="344" to-port="0" /> + <edge from-layer="343" from-port="0" to-layer="344" to-port="1" /> + <edge from-layer="344" from-port="2" to-layer="346" to-port="2" /> + <edge from-layer="345" from-port="0" to-layer="346" to-port="3" /> + <edge from-layer="346" from-port="4" to-layer="354" to-port="2" /> + <edge from-layer="346" from-port="4" to-layer="349" to-port="1" /> + <edge from-layer="347" from-port="0" to-layer="349" to-port="2" /> + <edge from-layer="348" from-port="0" to-layer="349" to-port="3" /> + <edge from-layer="349" from-port="4" to-layer="351" to-port="0" /> + <edge from-layer="350" from-port="0" to-layer="351" to-port="1" /> + <edge from-layer="351" from-port="2" to-layer="355" to-port="0" /> + <edge from-layer="352" from-port="0" to-layer="354" to-port="1" /> + <edge from-layer="353" from-port="0" to-layer="354" to-port="3" /> + <edge from-layer="354" from-port="4" to-layer="355" to-port="1" /> + <edge from-layer="355" from-port="2" to-layer="363" to-port="0" /> + <edge from-layer="356" from-port="0" to-layer="359" to-port="0" /> + <edge from-layer="357" from-port="0" to-layer="359" to-port="1" /> + <edge from-layer="358" from-port="0" to-layer="359" to-port="3" /> + <edge from-layer="359" from-port="4" to-layer="361" to-port="0" /> + <edge from-layer="360" from-port="0" to-layer="361" to-port="2" /> + <edge from-layer="361" from-port="3" to-layer="362" to-port="0" /> + <edge from-layer="362" from-port="2" to-layer="363" to-port="1" /> + <edge from-layer="362" from-port="2" to-layer="392" to-port="1" /> + <edge from-layer="363" from-port="2" to-layer="364" to-port="1" /> + <edge from-layer="364" from-port="2" to-layer="455" to-port="0" /> + <edge from-layer="364" from-port="2" to-layer="419" to-port="0" /> + <edge from-layer="365" from-port="0" to-layer="366" to-port="1" /> + <edge from-layer="366" from-port="2" to-layer="370" to-port="0" /> + <edge from-layer="367" from-port="0" to-layer="370" to-port="1" /> + <edge from-layer="368" from-port="0" to-layer="370" to-port="2" /> + <edge from-layer="369" from-port="0" to-layer="370" to-port="3" /> + <edge from-layer="370" from-port="4" to-layer="371" to-port="0" /> + <edge from-layer="370" from-port="4" to-layer="385" to-port="0" /> + <edge from-layer="370" from-port="4" to-layer="374" to-port="0" /> + <edge from-layer="370" from-port="4" to-layer="390" to-port="0" /> + <edge from-layer="371" from-port="2" to-layer="393" to-port="0" /> + <edge from-layer="372" from-port="0" to-layer="382" to-port="0" /> + <edge from-layer="373" from-port="0" to-layer="382" to-port="1" /> + <edge from-layer="374" from-port="1" to-layer="376" to-port="0" /> + <edge from-layer="375" from-port="0" to-layer="376" to-port="2" /> + <edge from-layer="376" from-port="3" to-layer="377" to-port="0" /> + <edge from-layer="377" from-port="2" to-layer="378" to-port="0" /> + <edge from-layer="378" from-port="1" to-layer="380" to-port="0" /> + <edge from-layer="379" from-port="0" to-layer="380" to-port="1" /> + <edge from-layer="380" from-port="2" to-layer="382" to-port="2" /> + <edge from-layer="381" from-port="0" to-layer="382" to-port="3" /> + <edge from-layer="382" from-port="4" to-layer="385" to-port="1" /> + <edge from-layer="382" from-port="4" to-layer="390" to-port="2" /> + <edge from-layer="383" from-port="0" to-layer="385" to-port="2" /> + <edge from-layer="384" from-port="0" to-layer="385" to-port="3" /> + <edge from-layer="385" from-port="4" to-layer="387" to-port="0" /> + <edge from-layer="386" from-port="0" to-layer="387" to-port="1" /> + <edge from-layer="387" from-port="2" to-layer="391" to-port="0" /> + <edge from-layer="388" from-port="0" to-layer="390" to-port="1" /> + <edge from-layer="389" from-port="0" to-layer="390" to-port="3" /> + <edge from-layer="390" from-port="4" to-layer="391" to-port="1" /> + <edge from-layer="391" from-port="2" to-layer="392" to-port="0" /> + <edge from-layer="392" from-port="2" to-layer="393" to-port="1" /> + <edge from-layer="393" from-port="2" to-layer="394" to-port="1" /> + <edge from-layer="393" from-port="2" to-layer="414" to-port="0" /> + <edge from-layer="394" from-port="2" to-layer="7238" to-port="0" /> + <edge from-layer="394" from-port="2" to-layer="455" to-port="1" /> + <edge from-layer="395" from-port="0" to-layer="400" to-port="0" /> + <edge from-layer="396" from-port="0" to-layer="399" to-port="1" /> + <edge from-layer="397" from-port="0" to-layer="399" to-port="2" /> + <edge from-layer="398" from-port="0" to-layer="399" to-port="3" /> + <edge from-layer="399" from-port="4" to-layer="400" to-port="1" /> + <edge from-layer="400" from-port="2" to-layer="401" to-port="0" /> + <edge from-layer="401" from-port="1" to-layer="403" to-port="0" /> + <edge from-layer="402" from-port="0" to-layer="403" to-port="2" /> + <edge from-layer="403" from-port="3" to-layer="410" to-port="0" /> + <edge from-layer="404" from-port="0" to-layer="407" to-port="1" /> + <edge from-layer="405" from-port="0" to-layer="407" to-port="2" /> + <edge from-layer="406" from-port="0" to-layer="407" to-port="3" /> + <edge from-layer="407" from-port="4" to-layer="409" to-port="0" /> + <edge from-layer="408" from-port="0" to-layer="409" to-port="1" /> + <edge from-layer="409" from-port="2" to-layer="410" to-port="1" /> + <edge from-layer="410" from-port="2" to-layer="7237" to-port="0" /> + <edge from-layer="410" from-port="2" to-layer="455" to-port="2" /> + <edge from-layer="411" from-port="0" to-layer="433" to-port="0" /> + <edge from-layer="412" from-port="0" to-layer="427" to-port="0" /> + <edge from-layer="413" from-port="0" to-layer="427" to-port="1" /> + <edge from-layer="413" from-port="0" to-layer="431" to-port="1" /> + <edge from-layer="414" from-port="1" to-layer="417" to-port="0" /> + <edge from-layer="415" from-port="0" to-layer="417" to-port="1" /> + <edge from-layer="416" from-port="0" to-layer="417" to-port="2" /> + <edge from-layer="417" from-port="3" to-layer="418" to-port="1" /> + <edge from-layer="418" from-port="2" to-layer="423" to-port="0" /> + <edge from-layer="418" from-port="2" to-layer="430" to-port="0" /> + <edge from-layer="419" from-port="1" to-layer="422" to-port="0" /> + <edge from-layer="419" from-port="1" to-layer="448" to-port="0" /> + <edge from-layer="420" from-port="0" to-layer="422" to-port="1" /> + <edge from-layer="421" from-port="0" to-layer="422" to-port="2" /> + <edge from-layer="422" from-port="3" to-layer="423" to-port="1" /> + <edge from-layer="423" from-port="2" to-layer="425" to-port="0" /> + <edge from-layer="424" from-port="0" to-layer="425" to-port="1" /> + <edge from-layer="425" from-port="2" to-layer="427" to-port="2" /> + <edge from-layer="426" from-port="0" to-layer="427" to-port="3" /> + <edge from-layer="426" from-port="0" to-layer="431" to-port="3" /> + <edge from-layer="427" from-port="4" to-layer="433" to-port="1" /> + <edge from-layer="428" from-port="0" to-layer="431" to-port="0" /> + <edge from-layer="429" from-port="0" to-layer="430" to-port="1" /> + <edge from-layer="430" from-port="2" to-layer="438" to-port="2" /> + <edge from-layer="430" from-port="2" to-layer="431" to-port="2" /> + <edge from-layer="431" from-port="4" to-layer="433" to-port="2" /> + <edge from-layer="432" from-port="0" to-layer="433" to-port="3" /> + <edge from-layer="433" from-port="4" to-layer="440" to-port="0" /> + <edge from-layer="434" from-port="0" to-layer="440" to-port="1" /> + <edge from-layer="435" from-port="0" to-layer="438" to-port="0" /> + <edge from-layer="436" from-port="0" to-layer="438" to-port="1" /> + <edge from-layer="437" from-port="0" to-layer="438" to-port="3" /> + <edge from-layer="438" from-port="4" to-layer="440" to-port="2" /> + <edge from-layer="439" from-port="0" to-layer="440" to-port="3" /> + <edge from-layer="440" from-port="4" to-layer="443" to-port="0" /> + <edge from-layer="441" from-port="0" to-layer="443" to-port="1" /> + <edge from-layer="442" from-port="0" to-layer="443" to-port="2" /> + <edge from-layer="443" from-port="3" to-layer="444" to-port="0" /> + <edge from-layer="444" from-port="2" to-layer="445" to-port="0" /> + <edge from-layer="444" from-port="2" to-layer="454" to-port="0" /> + <edge from-layer="445" from-port="1" to-layer="453" to-port="0" /> + <edge from-layer="446" from-port="0" to-layer="448" to-port="1" /> + <edge from-layer="447" from-port="0" to-layer="448" to-port="2" /> + <edge from-layer="448" from-port="3" to-layer="452" to-port="0" /> + <edge from-layer="449" from-port="0" to-layer="452" to-port="1" /> + <edge from-layer="450" from-port="0" to-layer="452" to-port="2" /> + <edge from-layer="451" from-port="0" to-layer="452" to-port="3" /> + <edge from-layer="452" from-port="4" to-layer="453" to-port="1" /> + <edge from-layer="453" from-port="2" to-layer="454" to-port="1" /> + <edge from-layer="454" from-port="2" to-layer="455" to-port="3" /> + <edge from-layer="455" from-port="4" to-layer="457" to-port="0" /> + <edge from-layer="456" from-port="0" to-layer="457" to-port="1" /> + <edge from-layer="457" from-port="2" to-layer="459" to-port="0" /> + <edge from-layer="458" from-port="0" to-layer="459" to-port="1" /> + <edge from-layer="459" from-port="2" to-layer="468" to-port="0" /> + <edge from-layer="460" from-port="0" to-layer="461" to-port="0" /> + <edge from-layer="461" from-port="1" to-layer="464" to-port="0" /> + <edge from-layer="462" from-port="0" to-layer="463" to-port="0" /> + <edge from-layer="463" from-port="1" to-layer="464" to-port="1" /> + <edge from-layer="464" from-port="2" to-layer="466" to-port="0" /> + <edge from-layer="465" from-port="0" to-layer="466" to-port="1" /> + <edge from-layer="466" from-port="2" to-layer="467" to-port="0" /> + <edge from-layer="467" from-port="1" to-layer="468" to-port="1" /> + <edge from-layer="468" from-port="2" to-layer="470" to-port="0" /> + <edge from-layer="469" from-port="0" to-layer="470" to-port="1" /> + <edge from-layer="470" from-port="2" to-layer="471" to-port="0" /> + <edge from-layer="471" from-port="2" to-layer="473" to-port="0" /> + <edge from-layer="471" from-port="2" to-layer="501" to-port="1" /> + <edge from-layer="472" from-port="0" to-layer="473" to-port="1" /> + <edge from-layer="473" from-port="2" to-layer="475" to-port="0" /> + <edge from-layer="474" from-port="0" to-layer="475" to-port="1" /> + <edge from-layer="475" from-port="2" to-layer="477" to-port="0" /> + <edge from-layer="476" from-port="0" to-layer="477" to-port="1" /> + <edge from-layer="477" from-port="2" to-layer="486" to-port="0" /> + <edge from-layer="478" from-port="0" to-layer="479" to-port="0" /> + <edge from-layer="479" from-port="1" to-layer="482" to-port="0" /> + <edge from-layer="480" from-port="0" to-layer="481" to-port="0" /> + <edge from-layer="481" from-port="1" to-layer="482" to-port="1" /> + <edge from-layer="482" from-port="2" to-layer="484" to-port="0" /> + <edge from-layer="483" from-port="0" to-layer="484" to-port="1" /> + <edge from-layer="484" from-port="2" to-layer="485" to-port="0" /> + <edge from-layer="485" from-port="1" to-layer="486" to-port="1" /> + <edge from-layer="486" from-port="2" to-layer="488" to-port="0" /> + <edge from-layer="487" from-port="0" to-layer="488" to-port="1" /> + <edge from-layer="488" from-port="2" to-layer="489" to-port="0" /> + <edge from-layer="489" from-port="1" to-layer="498" to-port="0" /> + <edge from-layer="490" from-port="0" to-layer="491" to-port="0" /> + <edge from-layer="491" from-port="1" to-layer="494" to-port="0" /> + <edge from-layer="492" from-port="0" to-layer="493" to-port="0" /> + <edge from-layer="493" from-port="1" to-layer="494" to-port="1" /> + <edge from-layer="494" from-port="2" to-layer="496" to-port="0" /> + <edge from-layer="495" from-port="0" to-layer="496" to-port="1" /> + <edge from-layer="496" from-port="2" to-layer="497" to-port="0" /> + <edge from-layer="497" from-port="1" to-layer="498" to-port="1" /> + <edge from-layer="498" from-port="2" to-layer="500" to-port="0" /> + <edge from-layer="499" from-port="0" to-layer="500" to-port="1" /> + <edge from-layer="500" from-port="2" to-layer="501" to-port="0" /> + <edge from-layer="501" from-port="2" to-layer="503" to-port="0" /> + <edge from-layer="501" from-port="2" to-layer="698" to-port="1" /> + <edge from-layer="502" from-port="0" to-layer="503" to-port="1" /> + <edge from-layer="503" from-port="2" to-layer="505" to-port="0" /> + <edge from-layer="504" from-port="0" to-layer="505" to-port="1" /> + <edge from-layer="505" from-port="2" to-layer="507" to-port="0" /> + <edge from-layer="506" from-port="0" to-layer="507" to-port="1" /> + <edge from-layer="507" from-port="2" to-layer="516" to-port="0" /> + <edge from-layer="508" from-port="0" to-layer="509" to-port="0" /> + <edge from-layer="509" from-port="1" to-layer="512" to-port="0" /> + <edge from-layer="510" from-port="0" to-layer="511" to-port="0" /> + <edge from-layer="511" from-port="1" to-layer="512" to-port="1" /> + <edge from-layer="512" from-port="2" to-layer="514" to-port="0" /> + <edge from-layer="513" from-port="0" to-layer="514" to-port="1" /> + <edge from-layer="514" from-port="2" to-layer="515" to-port="0" /> + <edge from-layer="515" from-port="1" to-layer="516" to-port="1" /> + <edge from-layer="516" from-port="2" to-layer="518" to-port="0" /> + <edge from-layer="517" from-port="0" to-layer="518" to-port="1" /> + <edge from-layer="518" from-port="2" to-layer="520" to-port="0" /> + <edge from-layer="519" from-port="0" to-layer="520" to-port="1" /> + <edge from-layer="520" from-port="2" to-layer="536" to-port="0" /> + <edge from-layer="520" from-port="2" to-layer="634" to-port="0" /> + <edge from-layer="520" from-port="2" to-layer="524" to-port="0" /> + <edge from-layer="521" from-port="0" to-layer="524" to-port="1" /> + <edge from-layer="522" from-port="0" to-layer="524" to-port="2" /> + <edge from-layer="523" from-port="0" to-layer="524" to-port="3" /> + <edge from-layer="524" from-port="4" to-layer="526" to-port="0" /> + <edge from-layer="525" from-port="0" to-layer="526" to-port="1" /> + <edge from-layer="526" from-port="2" to-layer="530" to-port="0" /> + <edge from-layer="527" from-port="0" to-layer="530" to-port="1" /> + <edge from-layer="528" from-port="0" to-layer="530" to-port="2" /> + <edge from-layer="529" from-port="0" to-layer="530" to-port="3" /> + <edge from-layer="530" from-port="4" to-layer="562" to-port="0" /> + <edge from-layer="530" from-port="4" to-layer="565" to-port="0" /> + <edge from-layer="530" from-port="4" to-layer="576" to-port="0" /> + <edge from-layer="530" from-port="4" to-layer="581" to-port="0" /> + <edge from-layer="531" from-port="0" to-layer="558" to-port="0" /> + <edge from-layer="532" from-port="0" to-layer="558" to-port="1" /> + <edge from-layer="533" from-port="0" to-layer="536" to-port="1" /> + <edge from-layer="534" from-port="0" to-layer="536" to-port="2" /> + <edge from-layer="535" from-port="0" to-layer="536" to-port="3" /> + <edge from-layer="536" from-port="4" to-layer="593" to-port="0" /> + <edge from-layer="536" from-port="4" to-layer="537" to-port="0" /> + <edge from-layer="537" from-port="1" to-layer="540" to-port="0" /> + <edge from-layer="538" from-port="0" to-layer="540" to-port="1" /> + <edge from-layer="539" from-port="0" to-layer="540" to-port="2" /> + <edge from-layer="540" from-port="3" to-layer="556" to-port="0" /> + <edge from-layer="541" from-port="0" to-layer="546" to-port="0" /> + <edge from-layer="542" from-port="0" to-layer="545" to-port="1" /> + <edge from-layer="543" from-port="0" to-layer="545" to-port="2" /> + <edge from-layer="544" from-port="0" to-layer="545" to-port="3" /> + <edge from-layer="545" from-port="4" to-layer="546" to-port="1" /> + <edge from-layer="546" from-port="2" to-layer="547" to-port="0" /> + <edge from-layer="547" from-port="1" to-layer="549" to-port="0" /> + <edge from-layer="548" from-port="0" to-layer="549" to-port="2" /> + <edge from-layer="549" from-port="3" to-layer="550" to-port="0" /> + <edge from-layer="549" from-port="3" to-layer="621" to-port="0" /> + <edge from-layer="550" from-port="1" to-layer="553" to-port="0" /> + <edge from-layer="551" from-port="0" to-layer="553" to-port="1" /> + <edge from-layer="552" from-port="0" to-layer="553" to-port="2" /> + <edge from-layer="553" from-port="3" to-layer="645" to-port="0" /> + <edge from-layer="553" from-port="3" to-layer="555" to-port="0" /> + <edge from-layer="554" from-port="0" to-layer="555" to-port="1" /> + <edge from-layer="555" from-port="2" to-layer="556" to-port="1" /> + <edge from-layer="556" from-port="2" to-layer="558" to-port="2" /> + <edge from-layer="556" from-port="2" to-layer="586" to-port="2" /> + <edge from-layer="557" from-port="0" to-layer="558" to-port="3" /> + <edge from-layer="558" from-port="4" to-layer="560" to-port="0" /> + <edge from-layer="559" from-port="0" to-layer="560" to-port="2" /> + <edge from-layer="560" from-port="3" to-layer="561" to-port="0" /> + <edge from-layer="561" from-port="2" to-layer="598" to-port="1" /> + <edge from-layer="561" from-port="2" to-layer="562" to-port="1" /> + <edge from-layer="562" from-port="2" to-layer="591" to-port="0" /> + <edge from-layer="563" from-port="0" to-layer="573" to-port="0" /> + <edge from-layer="564" from-port="0" to-layer="573" to-port="1" /> + <edge from-layer="565" from-port="1" to-layer="567" to-port="0" /> + <edge from-layer="566" from-port="0" to-layer="567" to-port="2" /> + <edge from-layer="567" from-port="3" to-layer="568" to-port="0" /> + <edge from-layer="568" from-port="2" to-layer="569" to-port="0" /> + <edge from-layer="569" from-port="1" to-layer="571" to-port="0" /> + <edge from-layer="570" from-port="0" to-layer="571" to-port="1" /> + <edge from-layer="571" from-port="2" to-layer="573" to-port="2" /> + <edge from-layer="572" from-port="0" to-layer="573" to-port="3" /> + <edge from-layer="573" from-port="4" to-layer="576" to-port="1" /> + <edge from-layer="573" from-port="4" to-layer="581" to-port="2" /> + <edge from-layer="574" from-port="0" to-layer="576" to-port="2" /> + <edge from-layer="575" from-port="0" to-layer="576" to-port="3" /> + <edge from-layer="576" from-port="4" to-layer="578" to-port="0" /> + <edge from-layer="577" from-port="0" to-layer="578" to-port="1" /> + <edge from-layer="578" from-port="2" to-layer="582" to-port="0" /> + <edge from-layer="579" from-port="0" to-layer="581" to-port="1" /> + <edge from-layer="580" from-port="0" to-layer="581" to-port="3" /> + <edge from-layer="581" from-port="4" to-layer="582" to-port="1" /> + <edge from-layer="582" from-port="2" to-layer="590" to-port="0" /> + <edge from-layer="583" from-port="0" to-layer="586" to-port="0" /> + <edge from-layer="584" from-port="0" to-layer="586" to-port="1" /> + <edge from-layer="585" from-port="0" to-layer="586" to-port="3" /> + <edge from-layer="586" from-port="4" to-layer="588" to-port="0" /> + <edge from-layer="587" from-port="0" to-layer="588" to-port="2" /> + <edge from-layer="588" from-port="3" to-layer="589" to-port="0" /> + <edge from-layer="589" from-port="2" to-layer="619" to-port="1" /> + <edge from-layer="589" from-port="2" to-layer="590" to-port="1" /> + <edge from-layer="590" from-port="2" to-layer="591" to-port="1" /> + <edge from-layer="591" from-port="2" to-layer="682" to-port="0" /> + <edge from-layer="591" from-port="2" to-layer="646" to-port="0" /> + <edge from-layer="592" from-port="0" to-layer="593" to-port="1" /> + <edge from-layer="593" from-port="2" to-layer="597" to-port="0" /> + <edge from-layer="594" from-port="0" to-layer="597" to-port="1" /> + <edge from-layer="595" from-port="0" to-layer="597" to-port="2" /> + <edge from-layer="596" from-port="0" to-layer="597" to-port="3" /> + <edge from-layer="597" from-port="4" to-layer="598" to-port="0" /> + <edge from-layer="597" from-port="4" to-layer="601" to-port="0" /> + <edge from-layer="597" from-port="4" to-layer="617" to-port="0" /> + <edge from-layer="597" from-port="4" to-layer="612" to-port="0" /> + <edge from-layer="598" from-port="2" to-layer="620" to-port="0" /> + <edge from-layer="599" from-port="0" to-layer="609" to-port="0" /> + <edge from-layer="600" from-port="0" to-layer="609" to-port="1" /> + <edge from-layer="601" from-port="1" to-layer="603" to-port="0" /> + <edge from-layer="602" from-port="0" to-layer="603" to-port="2" /> + <edge from-layer="603" from-port="3" to-layer="604" to-port="0" /> + <edge from-layer="604" from-port="2" to-layer="605" to-port="0" /> + <edge from-layer="605" from-port="1" to-layer="607" to-port="0" /> + <edge from-layer="606" from-port="0" to-layer="607" to-port="1" /> + <edge from-layer="607" from-port="2" to-layer="609" to-port="2" /> + <edge from-layer="608" from-port="0" to-layer="609" to-port="3" /> + <edge from-layer="609" from-port="4" to-layer="612" to-port="1" /> + <edge from-layer="609" from-port="4" to-layer="617" to-port="2" /> + <edge from-layer="610" from-port="0" to-layer="612" to-port="2" /> + <edge from-layer="611" from-port="0" to-layer="612" to-port="3" /> + <edge from-layer="612" from-port="4" to-layer="614" to-port="0" /> + <edge from-layer="613" from-port="0" to-layer="614" to-port="1" /> + <edge from-layer="614" from-port="2" to-layer="618" to-port="0" /> + <edge from-layer="615" from-port="0" to-layer="617" to-port="1" /> + <edge from-layer="616" from-port="0" to-layer="617" to-port="3" /> + <edge from-layer="617" from-port="4" to-layer="618" to-port="1" /> + <edge from-layer="618" from-port="2" to-layer="619" to-port="0" /> + <edge from-layer="619" from-port="2" to-layer="620" to-port="1" /> + <edge from-layer="620" from-port="2" to-layer="621" to-port="1" /> + <edge from-layer="620" from-port="2" to-layer="641" to-port="0" /> + <edge from-layer="621" from-port="2" to-layer="7216" to-port="0" /> + <edge from-layer="621" from-port="2" to-layer="682" to-port="1" /> + <edge from-layer="622" from-port="0" to-layer="627" to-port="0" /> + <edge from-layer="623" from-port="0" to-layer="626" to-port="1" /> + <edge from-layer="624" from-port="0" to-layer="626" to-port="2" /> + <edge from-layer="625" from-port="0" to-layer="626" to-port="3" /> + <edge from-layer="626" from-port="4" to-layer="627" to-port="1" /> + <edge from-layer="627" from-port="2" to-layer="628" to-port="0" /> + <edge from-layer="628" from-port="1" to-layer="630" to-port="0" /> + <edge from-layer="629" from-port="0" to-layer="630" to-port="2" /> + <edge from-layer="630" from-port="3" to-layer="637" to-port="0" /> + <edge from-layer="631" from-port="0" to-layer="634" to-port="1" /> + <edge from-layer="632" from-port="0" to-layer="634" to-port="2" /> + <edge from-layer="633" from-port="0" to-layer="634" to-port="3" /> + <edge from-layer="634" from-port="4" to-layer="636" to-port="0" /> + <edge from-layer="635" from-port="0" to-layer="636" to-port="1" /> + <edge from-layer="636" from-port="2" to-layer="637" to-port="1" /> + <edge from-layer="637" from-port="2" to-layer="7215" to-port="0" /> + <edge from-layer="637" from-port="2" to-layer="682" to-port="2" /> + <edge from-layer="638" from-port="0" to-layer="660" to-port="0" /> + <edge from-layer="639" from-port="0" to-layer="654" to-port="0" /> + <edge from-layer="640" from-port="0" to-layer="658" to-port="1" /> + <edge from-layer="640" from-port="0" to-layer="654" to-port="1" /> + <edge from-layer="641" from-port="1" to-layer="644" to-port="0" /> + <edge from-layer="642" from-port="0" to-layer="644" to-port="1" /> + <edge from-layer="643" from-port="0" to-layer="644" to-port="2" /> + <edge from-layer="644" from-port="3" to-layer="645" to-port="1" /> + <edge from-layer="645" from-port="2" to-layer="650" to-port="0" /> + <edge from-layer="645" from-port="2" to-layer="657" to-port="0" /> + <edge from-layer="646" from-port="1" to-layer="675" to-port="0" /> + <edge from-layer="646" from-port="1" to-layer="649" to-port="0" /> + <edge from-layer="647" from-port="0" to-layer="649" to-port="1" /> + <edge from-layer="648" from-port="0" to-layer="649" to-port="2" /> + <edge from-layer="649" from-port="3" to-layer="650" to-port="1" /> + <edge from-layer="650" from-port="2" to-layer="652" to-port="0" /> + <edge from-layer="651" from-port="0" to-layer="652" to-port="1" /> + <edge from-layer="652" from-port="2" to-layer="654" to-port="2" /> + <edge from-layer="653" from-port="0" to-layer="658" to-port="3" /> + <edge from-layer="653" from-port="0" to-layer="654" to-port="3" /> + <edge from-layer="654" from-port="4" to-layer="660" to-port="1" /> + <edge from-layer="655" from-port="0" to-layer="658" to-port="0" /> + <edge from-layer="656" from-port="0" to-layer="657" to-port="1" /> + <edge from-layer="657" from-port="2" to-layer="665" to-port="2" /> + <edge from-layer="657" from-port="2" to-layer="658" to-port="2" /> + <edge from-layer="658" from-port="4" to-layer="660" to-port="2" /> + <edge from-layer="659" from-port="0" to-layer="660" to-port="3" /> + <edge from-layer="660" from-port="4" to-layer="667" to-port="0" /> + <edge from-layer="661" from-port="0" to-layer="667" to-port="1" /> + <edge from-layer="662" from-port="0" to-layer="665" to-port="0" /> + <edge from-layer="663" from-port="0" to-layer="665" to-port="1" /> + <edge from-layer="664" from-port="0" to-layer="665" to-port="3" /> + <edge from-layer="665" from-port="4" to-layer="667" to-port="2" /> + <edge from-layer="666" from-port="0" to-layer="667" to-port="3" /> + <edge from-layer="667" from-port="4" to-layer="670" to-port="0" /> + <edge from-layer="668" from-port="0" to-layer="670" to-port="1" /> + <edge from-layer="669" from-port="0" to-layer="670" to-port="2" /> + <edge from-layer="670" from-port="3" to-layer="671" to-port="0" /> + <edge from-layer="671" from-port="2" to-layer="681" to-port="0" /> + <edge from-layer="671" from-port="2" to-layer="672" to-port="0" /> + <edge from-layer="672" from-port="1" to-layer="680" to-port="0" /> + <edge from-layer="673" from-port="0" to-layer="675" to-port="1" /> + <edge from-layer="674" from-port="0" to-layer="675" to-port="2" /> + <edge from-layer="675" from-port="3" to-layer="679" to-port="0" /> + <edge from-layer="676" from-port="0" to-layer="679" to-port="1" /> + <edge from-layer="677" from-port="0" to-layer="679" to-port="2" /> + <edge from-layer="678" from-port="0" to-layer="679" to-port="3" /> + <edge from-layer="679" from-port="4" to-layer="680" to-port="1" /> + <edge from-layer="680" from-port="2" to-layer="681" to-port="1" /> + <edge from-layer="681" from-port="2" to-layer="682" to-port="3" /> + <edge from-layer="682" from-port="4" to-layer="684" to-port="0" /> + <edge from-layer="683" from-port="0" to-layer="684" to-port="1" /> + <edge from-layer="684" from-port="2" to-layer="686" to-port="0" /> + <edge from-layer="685" from-port="0" to-layer="686" to-port="1" /> + <edge from-layer="686" from-port="2" to-layer="695" to-port="0" /> + <edge from-layer="687" from-port="0" to-layer="688" to-port="0" /> + <edge from-layer="688" from-port="1" to-layer="691" to-port="0" /> + <edge from-layer="689" from-port="0" to-layer="690" to-port="0" /> + <edge from-layer="690" from-port="1" to-layer="691" to-port="1" /> + <edge from-layer="691" from-port="2" to-layer="693" to-port="0" /> + <edge from-layer="692" from-port="0" to-layer="693" to-port="1" /> + <edge from-layer="693" from-port="2" to-layer="694" to-port="0" /> + <edge from-layer="694" from-port="1" to-layer="695" to-port="1" /> + <edge from-layer="695" from-port="2" to-layer="697" to-port="0" /> + <edge from-layer="696" from-port="0" to-layer="697" to-port="1" /> + <edge from-layer="697" from-port="2" to-layer="698" to-port="0" /> + <edge from-layer="698" from-port="2" to-layer="728" to-port="1" /> + <edge from-layer="698" from-port="2" to-layer="700" to-port="0" /> + <edge from-layer="699" from-port="0" to-layer="700" to-port="1" /> + <edge from-layer="700" from-port="2" to-layer="702" to-port="0" /> + <edge from-layer="701" from-port="0" to-layer="702" to-port="1" /> + <edge from-layer="702" from-port="2" to-layer="704" to-port="0" /> + <edge from-layer="703" from-port="0" to-layer="704" to-port="1" /> + <edge from-layer="704" from-port="2" to-layer="713" to-port="0" /> + <edge from-layer="705" from-port="0" to-layer="706" to-port="0" /> + <edge from-layer="706" from-port="1" to-layer="709" to-port="0" /> + <edge from-layer="707" from-port="0" to-layer="708" to-port="0" /> + <edge from-layer="708" from-port="1" to-layer="709" to-port="1" /> + <edge from-layer="709" from-port="2" to-layer="711" to-port="0" /> + <edge from-layer="710" from-port="0" to-layer="711" to-port="1" /> + <edge from-layer="711" from-port="2" to-layer="712" to-port="0" /> + <edge from-layer="712" from-port="1" to-layer="713" to-port="1" /> + <edge from-layer="713" from-port="2" to-layer="715" to-port="0" /> + <edge from-layer="714" from-port="0" to-layer="715" to-port="1" /> + <edge from-layer="715" from-port="2" to-layer="716" to-port="0" /> + <edge from-layer="716" from-port="1" to-layer="725" to-port="0" /> + <edge from-layer="717" from-port="0" to-layer="718" to-port="0" /> + <edge from-layer="718" from-port="1" to-layer="721" to-port="0" /> + <edge from-layer="719" from-port="0" to-layer="720" to-port="0" /> + <edge from-layer="720" from-port="1" to-layer="721" to-port="1" /> + <edge from-layer="721" from-port="2" to-layer="723" to-port="0" /> + <edge from-layer="722" from-port="0" to-layer="723" to-port="1" /> + <edge from-layer="723" from-port="2" to-layer="724" to-port="0" /> + <edge from-layer="724" from-port="1" to-layer="725" to-port="1" /> + <edge from-layer="725" from-port="2" to-layer="727" to-port="0" /> + <edge from-layer="726" from-port="0" to-layer="727" to-port="1" /> + <edge from-layer="727" from-port="2" to-layer="728" to-port="0" /> + <edge from-layer="728" from-port="2" to-layer="925" to-port="1" /> + <edge from-layer="728" from-port="2" to-layer="730" to-port="0" /> + <edge from-layer="729" from-port="0" to-layer="730" to-port="1" /> + <edge from-layer="730" from-port="2" to-layer="732" to-port="0" /> + <edge from-layer="731" from-port="0" to-layer="732" to-port="1" /> + <edge from-layer="732" from-port="2" to-layer="734" to-port="0" /> + <edge from-layer="733" from-port="0" to-layer="734" to-port="1" /> + <edge from-layer="734" from-port="2" to-layer="743" to-port="0" /> + <edge from-layer="735" from-port="0" to-layer="736" to-port="0" /> + <edge from-layer="736" from-port="1" to-layer="739" to-port="0" /> + <edge from-layer="737" from-port="0" to-layer="738" to-port="0" /> + <edge from-layer="738" from-port="1" to-layer="739" to-port="1" /> + <edge from-layer="739" from-port="2" to-layer="741" to-port="0" /> + <edge from-layer="740" from-port="0" to-layer="741" to-port="1" /> + <edge from-layer="741" from-port="2" to-layer="742" to-port="0" /> + <edge from-layer="742" from-port="1" to-layer="743" to-port="1" /> + <edge from-layer="743" from-port="2" to-layer="745" to-port="0" /> + <edge from-layer="744" from-port="0" to-layer="745" to-port="1" /> + <edge from-layer="745" from-port="2" to-layer="747" to-port="0" /> + <edge from-layer="746" from-port="0" to-layer="747" to-port="1" /> + <edge from-layer="747" from-port="2" to-layer="751" to-port="0" /> + <edge from-layer="747" from-port="2" to-layer="861" to-port="0" /> + <edge from-layer="747" from-port="2" to-layer="763" to-port="0" /> + <edge from-layer="748" from-port="0" to-layer="751" to-port="1" /> + <edge from-layer="749" from-port="0" to-layer="751" to-port="2" /> + <edge from-layer="750" from-port="0" to-layer="751" to-port="3" /> + <edge from-layer="751" from-port="4" to-layer="753" to-port="0" /> + <edge from-layer="752" from-port="0" to-layer="753" to-port="1" /> + <edge from-layer="753" from-port="2" to-layer="757" to-port="0" /> + <edge from-layer="754" from-port="0" to-layer="757" to-port="1" /> + <edge from-layer="755" from-port="0" to-layer="757" to-port="2" /> + <edge from-layer="756" from-port="0" to-layer="757" to-port="3" /> + <edge from-layer="757" from-port="4" to-layer="792" to-port="0" /> + <edge from-layer="757" from-port="4" to-layer="789" to-port="0" /> + <edge from-layer="757" from-port="4" to-layer="803" to-port="0" /> + <edge from-layer="757" from-port="4" to-layer="808" to-port="0" /> + <edge from-layer="758" from-port="0" to-layer="785" to-port="0" /> + <edge from-layer="759" from-port="0" to-layer="785" to-port="1" /> + <edge from-layer="760" from-port="0" to-layer="763" to-port="1" /> + <edge from-layer="761" from-port="0" to-layer="763" to-port="2" /> + <edge from-layer="762" from-port="0" to-layer="763" to-port="3" /> + <edge from-layer="763" from-port="4" to-layer="820" to-port="0" /> + <edge from-layer="763" from-port="4" to-layer="764" to-port="0" /> + <edge from-layer="764" from-port="1" to-layer="767" to-port="0" /> + <edge from-layer="765" from-port="0" to-layer="767" to-port="1" /> + <edge from-layer="766" from-port="0" to-layer="767" to-port="2" /> + <edge from-layer="767" from-port="3" to-layer="783" to-port="0" /> + <edge from-layer="768" from-port="0" to-layer="773" to-port="0" /> + <edge from-layer="769" from-port="0" to-layer="772" to-port="1" /> + <edge from-layer="770" from-port="0" to-layer="772" to-port="2" /> + <edge from-layer="771" from-port="0" to-layer="772" to-port="3" /> + <edge from-layer="772" from-port="4" to-layer="773" to-port="1" /> + <edge from-layer="773" from-port="2" to-layer="774" to-port="0" /> + <edge from-layer="774" from-port="1" to-layer="776" to-port="0" /> + <edge from-layer="775" from-port="0" to-layer="776" to-port="2" /> + <edge from-layer="776" from-port="3" to-layer="848" to-port="0" /> + <edge from-layer="776" from-port="3" to-layer="777" to-port="0" /> + <edge from-layer="777" from-port="1" to-layer="780" to-port="0" /> + <edge from-layer="778" from-port="0" to-layer="780" to-port="1" /> + <edge from-layer="779" from-port="0" to-layer="780" to-port="2" /> + <edge from-layer="780" from-port="3" to-layer="782" to-port="0" /> + <edge from-layer="780" from-port="3" to-layer="872" to-port="0" /> + <edge from-layer="781" from-port="0" to-layer="782" to-port="1" /> + <edge from-layer="782" from-port="2" to-layer="783" to-port="1" /> + <edge from-layer="783" from-port="2" to-layer="785" to-port="2" /> + <edge from-layer="783" from-port="2" to-layer="813" to-port="2" /> + <edge from-layer="784" from-port="0" to-layer="785" to-port="3" /> + <edge from-layer="785" from-port="4" to-layer="787" to-port="0" /> + <edge from-layer="786" from-port="0" to-layer="787" to-port="2" /> + <edge from-layer="787" from-port="3" to-layer="788" to-port="0" /> + <edge from-layer="788" from-port="2" to-layer="789" to-port="1" /> + <edge from-layer="788" from-port="2" to-layer="825" to-port="1" /> + <edge from-layer="789" from-port="2" to-layer="818" to-port="0" /> + <edge from-layer="790" from-port="0" to-layer="800" to-port="0" /> + <edge from-layer="791" from-port="0" to-layer="800" to-port="1" /> + <edge from-layer="792" from-port="1" to-layer="794" to-port="0" /> + <edge from-layer="793" from-port="0" to-layer="794" to-port="2" /> + <edge from-layer="794" from-port="3" to-layer="795" to-port="0" /> + <edge from-layer="795" from-port="2" to-layer="796" to-port="0" /> + <edge from-layer="796" from-port="1" to-layer="798" to-port="0" /> + <edge from-layer="797" from-port="0" to-layer="798" to-port="1" /> + <edge from-layer="798" from-port="2" to-layer="800" to-port="2" /> + <edge from-layer="799" from-port="0" to-layer="800" to-port="3" /> + <edge from-layer="800" from-port="4" to-layer="808" to-port="2" /> + <edge from-layer="800" from-port="4" to-layer="803" to-port="1" /> + <edge from-layer="801" from-port="0" to-layer="803" to-port="2" /> + <edge from-layer="802" from-port="0" to-layer="803" to-port="3" /> + <edge from-layer="803" from-port="4" to-layer="805" to-port="0" /> + <edge from-layer="804" from-port="0" to-layer="805" to-port="1" /> + <edge from-layer="805" from-port="2" to-layer="809" to-port="0" /> + <edge from-layer="806" from-port="0" to-layer="808" to-port="1" /> + <edge from-layer="807" from-port="0" to-layer="808" to-port="3" /> + <edge from-layer="808" from-port="4" to-layer="809" to-port="1" /> + <edge from-layer="809" from-port="2" to-layer="817" to-port="0" /> + <edge from-layer="810" from-port="0" to-layer="813" to-port="0" /> + <edge from-layer="811" from-port="0" to-layer="813" to-port="1" /> + <edge from-layer="812" from-port="0" to-layer="813" to-port="3" /> + <edge from-layer="813" from-port="4" to-layer="815" to-port="0" /> + <edge from-layer="814" from-port="0" to-layer="815" to-port="2" /> + <edge from-layer="815" from-port="3" to-layer="816" to-port="0" /> + <edge from-layer="816" from-port="2" to-layer="846" to-port="1" /> + <edge from-layer="816" from-port="2" to-layer="817" to-port="1" /> + <edge from-layer="817" from-port="2" to-layer="818" to-port="1" /> + <edge from-layer="818" from-port="2" to-layer="873" to-port="0" /> + <edge from-layer="818" from-port="2" to-layer="909" to-port="0" /> + <edge from-layer="819" from-port="0" to-layer="820" to-port="1" /> + <edge from-layer="820" from-port="2" to-layer="824" to-port="0" /> + <edge from-layer="821" from-port="0" to-layer="824" to-port="1" /> + <edge from-layer="822" from-port="0" to-layer="824" to-port="2" /> + <edge from-layer="823" from-port="0" to-layer="824" to-port="3" /> + <edge from-layer="824" from-port="4" to-layer="825" to-port="0" /> + <edge from-layer="824" from-port="4" to-layer="828" to-port="0" /> + <edge from-layer="824" from-port="4" to-layer="839" to-port="0" /> + <edge from-layer="824" from-port="4" to-layer="844" to-port="0" /> + <edge from-layer="825" from-port="2" to-layer="847" to-port="0" /> + <edge from-layer="826" from-port="0" to-layer="836" to-port="0" /> + <edge from-layer="827" from-port="0" to-layer="836" to-port="1" /> + <edge from-layer="828" from-port="1" to-layer="830" to-port="0" /> + <edge from-layer="829" from-port="0" to-layer="830" to-port="2" /> + <edge from-layer="830" from-port="3" to-layer="831" to-port="0" /> + <edge from-layer="831" from-port="2" to-layer="832" to-port="0" /> + <edge from-layer="832" from-port="1" to-layer="834" to-port="0" /> + <edge from-layer="833" from-port="0" to-layer="834" to-port="1" /> + <edge from-layer="834" from-port="2" to-layer="836" to-port="2" /> + <edge from-layer="835" from-port="0" to-layer="836" to-port="3" /> + <edge from-layer="836" from-port="4" to-layer="844" to-port="2" /> + <edge from-layer="836" from-port="4" to-layer="839" to-port="1" /> + <edge from-layer="837" from-port="0" to-layer="839" to-port="2" /> + <edge from-layer="838" from-port="0" to-layer="839" to-port="3" /> + <edge from-layer="839" from-port="4" to-layer="841" to-port="0" /> + <edge from-layer="840" from-port="0" to-layer="841" to-port="1" /> + <edge from-layer="841" from-port="2" to-layer="845" to-port="0" /> + <edge from-layer="842" from-port="0" to-layer="844" to-port="1" /> + <edge from-layer="843" from-port="0" to-layer="844" to-port="3" /> + <edge from-layer="844" from-port="4" to-layer="845" to-port="1" /> + <edge from-layer="845" from-port="2" to-layer="846" to-port="0" /> + <edge from-layer="846" from-port="2" to-layer="847" to-port="1" /> + <edge from-layer="847" from-port="2" to-layer="868" to-port="0" /> + <edge from-layer="847" from-port="2" to-layer="848" to-port="1" /> + <edge from-layer="848" from-port="2" to-layer="909" to-port="1" /> + <edge from-layer="848" from-port="2" to-layer="7194" to-port="0" /> + <edge from-layer="849" from-port="0" to-layer="854" to-port="0" /> + <edge from-layer="850" from-port="0" to-layer="853" to-port="1" /> + <edge from-layer="851" from-port="0" to-layer="853" to-port="2" /> + <edge from-layer="852" from-port="0" to-layer="853" to-port="3" /> + <edge from-layer="853" from-port="4" to-layer="854" to-port="1" /> + <edge from-layer="854" from-port="2" to-layer="855" to-port="0" /> + <edge from-layer="855" from-port="1" to-layer="857" to-port="0" /> + <edge from-layer="856" from-port="0" to-layer="857" to-port="2" /> + <edge from-layer="857" from-port="3" to-layer="864" to-port="0" /> + <edge from-layer="858" from-port="0" to-layer="861" to-port="1" /> + <edge from-layer="859" from-port="0" to-layer="861" to-port="2" /> + <edge from-layer="860" from-port="0" to-layer="861" to-port="3" /> + <edge from-layer="861" from-port="4" to-layer="863" to-port="0" /> + <edge from-layer="862" from-port="0" to-layer="863" to-port="1" /> + <edge from-layer="863" from-port="2" to-layer="864" to-port="1" /> + <edge from-layer="864" from-port="2" to-layer="7193" to-port="0" /> + <edge from-layer="864" from-port="2" to-layer="909" to-port="2" /> + <edge from-layer="865" from-port="0" to-layer="887" to-port="0" /> + <edge from-layer="866" from-port="0" to-layer="881" to-port="0" /> + <edge from-layer="867" from-port="0" to-layer="885" to-port="1" /> + <edge from-layer="867" from-port="0" to-layer="881" to-port="1" /> + <edge from-layer="868" from-port="1" to-layer="871" to-port="0" /> + <edge from-layer="869" from-port="0" to-layer="871" to-port="1" /> + <edge from-layer="870" from-port="0" to-layer="871" to-port="2" /> + <edge from-layer="871" from-port="3" to-layer="872" to-port="1" /> + <edge from-layer="872" from-port="2" to-layer="884" to-port="0" /> + <edge from-layer="872" from-port="2" to-layer="877" to-port="0" /> + <edge from-layer="873" from-port="1" to-layer="902" to-port="0" /> + <edge from-layer="873" from-port="1" to-layer="876" to-port="0" /> + <edge from-layer="874" from-port="0" to-layer="876" to-port="1" /> + <edge from-layer="875" from-port="0" to-layer="876" to-port="2" /> + <edge from-layer="876" from-port="3" to-layer="877" to-port="1" /> + <edge from-layer="877" from-port="2" to-layer="879" to-port="0" /> + <edge from-layer="878" from-port="0" to-layer="879" to-port="1" /> + <edge from-layer="879" from-port="2" to-layer="881" to-port="2" /> + <edge from-layer="880" from-port="0" to-layer="885" to-port="3" /> + <edge from-layer="880" from-port="0" to-layer="881" to-port="3" /> + <edge from-layer="881" from-port="4" to-layer="887" to-port="1" /> + <edge from-layer="882" from-port="0" to-layer="885" to-port="0" /> + <edge from-layer="883" from-port="0" to-layer="884" to-port="1" /> + <edge from-layer="884" from-port="2" to-layer="892" to-port="2" /> + <edge from-layer="884" from-port="2" to-layer="885" to-port="2" /> + <edge from-layer="885" from-port="4" to-layer="887" to-port="2" /> + <edge from-layer="886" from-port="0" to-layer="887" to-port="3" /> + <edge from-layer="887" from-port="4" to-layer="894" to-port="0" /> + <edge from-layer="888" from-port="0" to-layer="894" to-port="1" /> + <edge from-layer="889" from-port="0" to-layer="892" to-port="0" /> + <edge from-layer="890" from-port="0" to-layer="892" to-port="1" /> + <edge from-layer="891" from-port="0" to-layer="892" to-port="3" /> + <edge from-layer="892" from-port="4" to-layer="894" to-port="2" /> + <edge from-layer="893" from-port="0" to-layer="894" to-port="3" /> + <edge from-layer="894" from-port="4" to-layer="897" to-port="0" /> + <edge from-layer="895" from-port="0" to-layer="897" to-port="1" /> + <edge from-layer="896" from-port="0" to-layer="897" to-port="2" /> + <edge from-layer="897" from-port="3" to-layer="898" to-port="0" /> + <edge from-layer="898" from-port="2" to-layer="908" to-port="0" /> + <edge from-layer="898" from-port="2" to-layer="899" to-port="0" /> + <edge from-layer="899" from-port="1" to-layer="907" to-port="0" /> + <edge from-layer="900" from-port="0" to-layer="902" to-port="1" /> + <edge from-layer="901" from-port="0" to-layer="902" to-port="2" /> + <edge from-layer="902" from-port="3" to-layer="906" to-port="0" /> + <edge from-layer="903" from-port="0" to-layer="906" to-port="1" /> + <edge from-layer="904" from-port="0" to-layer="906" to-port="2" /> + <edge from-layer="905" from-port="0" to-layer="906" to-port="3" /> + <edge from-layer="906" from-port="4" to-layer="907" to-port="1" /> + <edge from-layer="907" from-port="2" to-layer="908" to-port="1" /> + <edge from-layer="908" from-port="2" to-layer="909" to-port="3" /> + <edge from-layer="909" from-port="4" to-layer="911" to-port="0" /> + <edge from-layer="910" from-port="0" to-layer="911" to-port="1" /> + <edge from-layer="911" from-port="2" to-layer="913" to-port="0" /> + <edge from-layer="912" from-port="0" to-layer="913" to-port="1" /> + <edge from-layer="913" from-port="2" to-layer="922" to-port="0" /> + <edge from-layer="914" from-port="0" to-layer="915" to-port="0" /> + <edge from-layer="915" from-port="1" to-layer="918" to-port="0" /> + <edge from-layer="916" from-port="0" to-layer="917" to-port="0" /> + <edge from-layer="917" from-port="1" to-layer="918" to-port="1" /> + <edge from-layer="918" from-port="2" to-layer="920" to-port="0" /> + <edge from-layer="919" from-port="0" to-layer="920" to-port="1" /> + <edge from-layer="920" from-port="2" to-layer="921" to-port="0" /> + <edge from-layer="921" from-port="1" to-layer="922" to-port="1" /> + <edge from-layer="922" from-port="2" to-layer="924" to-port="0" /> + <edge from-layer="923" from-port="0" to-layer="924" to-port="1" /> + <edge from-layer="924" from-port="2" to-layer="925" to-port="0" /> + <edge from-layer="925" from-port="2" to-layer="955" to-port="1" /> + <edge from-layer="925" from-port="2" to-layer="927" to-port="0" /> + <edge from-layer="926" from-port="0" to-layer="927" to-port="1" /> + <edge from-layer="927" from-port="2" to-layer="929" to-port="0" /> + <edge from-layer="928" from-port="0" to-layer="929" to-port="1" /> + <edge from-layer="929" from-port="2" to-layer="931" to-port="0" /> + <edge from-layer="930" from-port="0" to-layer="931" to-port="1" /> + <edge from-layer="931" from-port="2" to-layer="940" to-port="0" /> + <edge from-layer="932" from-port="0" to-layer="933" to-port="0" /> + <edge from-layer="933" from-port="1" to-layer="936" to-port="0" /> + <edge from-layer="934" from-port="0" to-layer="935" to-port="0" /> + <edge from-layer="935" from-port="1" to-layer="936" to-port="1" /> + <edge from-layer="936" from-port="2" to-layer="938" to-port="0" /> + <edge from-layer="937" from-port="0" to-layer="938" to-port="1" /> + <edge from-layer="938" from-port="2" to-layer="939" to-port="0" /> + <edge from-layer="939" from-port="1" to-layer="940" to-port="1" /> + <edge from-layer="940" from-port="2" to-layer="942" to-port="0" /> + <edge from-layer="941" from-port="0" to-layer="942" to-port="1" /> + <edge from-layer="942" from-port="2" to-layer="943" to-port="0" /> + <edge from-layer="943" from-port="1" to-layer="952" to-port="0" /> + <edge from-layer="944" from-port="0" to-layer="945" to-port="0" /> + <edge from-layer="945" from-port="1" to-layer="948" to-port="0" /> + <edge from-layer="946" from-port="0" to-layer="947" to-port="0" /> + <edge from-layer="947" from-port="1" to-layer="948" to-port="1" /> + <edge from-layer="948" from-port="2" to-layer="950" to-port="0" /> + <edge from-layer="949" from-port="0" to-layer="950" to-port="1" /> + <edge from-layer="950" from-port="2" to-layer="951" to-port="0" /> + <edge from-layer="951" from-port="1" to-layer="952" to-port="1" /> + <edge from-layer="952" from-port="2" to-layer="954" to-port="0" /> + <edge from-layer="953" from-port="0" to-layer="954" to-port="1" /> + <edge from-layer="954" from-port="2" to-layer="955" to-port="0" /> + <edge from-layer="955" from-port="2" to-layer="957" to-port="0" /> + <edge from-layer="955" from-port="2" to-layer="1152" to-port="1" /> + <edge from-layer="956" from-port="0" to-layer="957" to-port="1" /> + <edge from-layer="957" from-port="2" to-layer="959" to-port="0" /> + <edge from-layer="958" from-port="0" to-layer="959" to-port="1" /> + <edge from-layer="959" from-port="2" to-layer="961" to-port="0" /> + <edge from-layer="960" from-port="0" to-layer="961" to-port="1" /> + <edge from-layer="961" from-port="2" to-layer="970" to-port="0" /> + <edge from-layer="962" from-port="0" to-layer="963" to-port="0" /> + <edge from-layer="963" from-port="1" to-layer="966" to-port="0" /> + <edge from-layer="964" from-port="0" to-layer="965" to-port="0" /> + <edge from-layer="965" from-port="1" to-layer="966" to-port="1" /> + <edge from-layer="966" from-port="2" to-layer="968" to-port="0" /> + <edge from-layer="967" from-port="0" to-layer="968" to-port="1" /> + <edge from-layer="968" from-port="2" to-layer="969" to-port="0" /> + <edge from-layer="969" from-port="1" to-layer="970" to-port="1" /> + <edge from-layer="970" from-port="2" to-layer="972" to-port="0" /> + <edge from-layer="971" from-port="0" to-layer="972" to-port="1" /> + <edge from-layer="972" from-port="2" to-layer="974" to-port="0" /> + <edge from-layer="973" from-port="0" to-layer="974" to-port="1" /> + <edge from-layer="974" from-port="2" to-layer="978" to-port="0" /> + <edge from-layer="974" from-port="2" to-layer="1088" to-port="0" /> + <edge from-layer="974" from-port="2" to-layer="990" to-port="0" /> + <edge from-layer="975" from-port="0" to-layer="978" to-port="1" /> + <edge from-layer="976" from-port="0" to-layer="978" to-port="2" /> + <edge from-layer="977" from-port="0" to-layer="978" to-port="3" /> + <edge from-layer="978" from-port="4" to-layer="980" to-port="0" /> + <edge from-layer="979" from-port="0" to-layer="980" to-port="1" /> + <edge from-layer="980" from-port="2" to-layer="984" to-port="0" /> + <edge from-layer="981" from-port="0" to-layer="984" to-port="1" /> + <edge from-layer="982" from-port="0" to-layer="984" to-port="2" /> + <edge from-layer="983" from-port="0" to-layer="984" to-port="3" /> + <edge from-layer="984" from-port="4" to-layer="1035" to-port="0" /> + <edge from-layer="984" from-port="4" to-layer="1030" to-port="0" /> + <edge from-layer="984" from-port="4" to-layer="1019" to-port="0" /> + <edge from-layer="984" from-port="4" to-layer="1016" to-port="0" /> + <edge from-layer="985" from-port="0" to-layer="1012" to-port="0" /> + <edge from-layer="986" from-port="0" to-layer="1012" to-port="1" /> + <edge from-layer="987" from-port="0" to-layer="990" to-port="1" /> + <edge from-layer="988" from-port="0" to-layer="990" to-port="2" /> + <edge from-layer="989" from-port="0" to-layer="990" to-port="3" /> + <edge from-layer="990" from-port="4" to-layer="1047" to-port="0" /> + <edge from-layer="990" from-port="4" to-layer="991" to-port="0" /> + <edge from-layer="991" from-port="1" to-layer="994" to-port="0" /> + <edge from-layer="992" from-port="0" to-layer="994" to-port="1" /> + <edge from-layer="993" from-port="0" to-layer="994" to-port="2" /> + <edge from-layer="994" from-port="3" to-layer="1010" to-port="0" /> + <edge from-layer="995" from-port="0" to-layer="1000" to-port="0" /> + <edge from-layer="996" from-port="0" to-layer="999" to-port="1" /> + <edge from-layer="997" from-port="0" to-layer="999" to-port="2" /> + <edge from-layer="998" from-port="0" to-layer="999" to-port="3" /> + <edge from-layer="999" from-port="4" to-layer="1000" to-port="1" /> + <edge from-layer="1000" from-port="2" to-layer="1001" to-port="0" /> + <edge from-layer="1001" from-port="1" to-layer="1003" to-port="0" /> + <edge from-layer="1002" from-port="0" to-layer="1003" to-port="2" /> + <edge from-layer="1003" from-port="3" to-layer="1004" to-port="0" /> + <edge from-layer="1003" from-port="3" to-layer="1075" to-port="0" /> + <edge from-layer="1004" from-port="1" to-layer="1007" to-port="0" /> + <edge from-layer="1005" from-port="0" to-layer="1007" to-port="1" /> + <edge from-layer="1006" from-port="0" to-layer="1007" to-port="2" /> + <edge from-layer="1007" from-port="3" to-layer="1009" to-port="0" /> + <edge from-layer="1007" from-port="3" to-layer="1099" to-port="0" /> + <edge from-layer="1008" from-port="0" to-layer="1009" to-port="1" /> + <edge from-layer="1009" from-port="2" to-layer="1010" to-port="1" /> + <edge from-layer="1010" from-port="2" to-layer="1040" to-port="2" /> + <edge from-layer="1010" from-port="2" to-layer="1012" to-port="2" /> + <edge from-layer="1011" from-port="0" to-layer="1012" to-port="3" /> + <edge from-layer="1012" from-port="4" to-layer="1014" to-port="0" /> + <edge from-layer="1013" from-port="0" to-layer="1014" to-port="2" /> + <edge from-layer="1014" from-port="3" to-layer="1015" to-port="0" /> + <edge from-layer="1015" from-port="2" to-layer="1052" to-port="1" /> + <edge from-layer="1015" from-port="2" to-layer="1016" to-port="1" /> + <edge from-layer="1016" from-port="2" to-layer="1045" to-port="0" /> + <edge from-layer="1017" from-port="0" to-layer="1027" to-port="0" /> + <edge from-layer="1018" from-port="0" to-layer="1027" to-port="1" /> + <edge from-layer="1019" from-port="1" to-layer="1021" to-port="0" /> + <edge from-layer="1020" from-port="0" to-layer="1021" to-port="2" /> + <edge from-layer="1021" from-port="3" to-layer="1022" to-port="0" /> + <edge from-layer="1022" from-port="2" to-layer="1023" to-port="0" /> + <edge from-layer="1023" from-port="1" to-layer="1025" to-port="0" /> + <edge from-layer="1024" from-port="0" to-layer="1025" to-port="1" /> + <edge from-layer="1025" from-port="2" to-layer="1027" to-port="2" /> + <edge from-layer="1026" from-port="0" to-layer="1027" to-port="3" /> + <edge from-layer="1027" from-port="4" to-layer="1030" to-port="1" /> + <edge from-layer="1027" from-port="4" to-layer="1035" to-port="2" /> + <edge from-layer="1028" from-port="0" to-layer="1030" to-port="2" /> + <edge from-layer="1029" from-port="0" to-layer="1030" to-port="3" /> + <edge from-layer="1030" from-port="4" to-layer="1032" to-port="0" /> + <edge from-layer="1031" from-port="0" to-layer="1032" to-port="1" /> + <edge from-layer="1032" from-port="2" to-layer="1036" to-port="0" /> + <edge from-layer="1033" from-port="0" to-layer="1035" to-port="1" /> + <edge from-layer="1034" from-port="0" to-layer="1035" to-port="3" /> + <edge from-layer="1035" from-port="4" to-layer="1036" to-port="1" /> + <edge from-layer="1036" from-port="2" to-layer="1044" to-port="0" /> + <edge from-layer="1037" from-port="0" to-layer="1040" to-port="0" /> + <edge from-layer="1038" from-port="0" to-layer="1040" to-port="1" /> + <edge from-layer="1039" from-port="0" to-layer="1040" to-port="3" /> + <edge from-layer="1040" from-port="4" to-layer="1042" to-port="0" /> + <edge from-layer="1041" from-port="0" to-layer="1042" to-port="2" /> + <edge from-layer="1042" from-port="3" to-layer="1043" to-port="0" /> + <edge from-layer="1043" from-port="2" to-layer="1073" to-port="1" /> + <edge from-layer="1043" from-port="2" to-layer="1044" to-port="1" /> + <edge from-layer="1044" from-port="2" to-layer="1045" to-port="1" /> + <edge from-layer="1045" from-port="2" to-layer="1136" to-port="0" /> + <edge from-layer="1045" from-port="2" to-layer="1100" to-port="0" /> + <edge from-layer="1046" from-port="0" to-layer="1047" to-port="1" /> + <edge from-layer="1047" from-port="2" to-layer="1051" to-port="0" /> + <edge from-layer="1048" from-port="0" to-layer="1051" to-port="1" /> + <edge from-layer="1049" from-port="0" to-layer="1051" to-port="2" /> + <edge from-layer="1050" from-port="0" to-layer="1051" to-port="3" /> + <edge from-layer="1051" from-port="4" to-layer="1052" to-port="0" /> + <edge from-layer="1051" from-port="4" to-layer="1071" to-port="0" /> + <edge from-layer="1051" from-port="4" to-layer="1066" to-port="0" /> + <edge from-layer="1051" from-port="4" to-layer="1055" to-port="0" /> + <edge from-layer="1052" from-port="2" to-layer="1074" to-port="0" /> + <edge from-layer="1053" from-port="0" to-layer="1063" to-port="0" /> + <edge from-layer="1054" from-port="0" to-layer="1063" to-port="1" /> + <edge from-layer="1055" from-port="1" to-layer="1057" to-port="0" /> + <edge from-layer="1056" from-port="0" to-layer="1057" to-port="2" /> + <edge from-layer="1057" from-port="3" to-layer="1058" to-port="0" /> + <edge from-layer="1058" from-port="2" to-layer="1059" to-port="0" /> + <edge from-layer="1059" from-port="1" to-layer="1061" to-port="0" /> + <edge from-layer="1060" from-port="0" to-layer="1061" to-port="1" /> + <edge from-layer="1061" from-port="2" to-layer="1063" to-port="2" /> + <edge from-layer="1062" from-port="0" to-layer="1063" to-port="3" /> + <edge from-layer="1063" from-port="4" to-layer="1066" to-port="1" /> + <edge from-layer="1063" from-port="4" to-layer="1071" to-port="2" /> + <edge from-layer="1064" from-port="0" to-layer="1066" to-port="2" /> + <edge from-layer="1065" from-port="0" to-layer="1066" to-port="3" /> + <edge from-layer="1066" from-port="4" to-layer="1068" to-port="0" /> + <edge from-layer="1067" from-port="0" to-layer="1068" to-port="1" /> + <edge from-layer="1068" from-port="2" to-layer="1072" to-port="0" /> + <edge from-layer="1069" from-port="0" to-layer="1071" to-port="1" /> + <edge from-layer="1070" from-port="0" to-layer="1071" to-port="3" /> + <edge from-layer="1071" from-port="4" to-layer="1072" to-port="1" /> + <edge from-layer="1072" from-port="2" to-layer="1073" to-port="0" /> + <edge from-layer="1073" from-port="2" to-layer="1074" to-port="1" /> + <edge from-layer="1074" from-port="2" to-layer="1075" to-port="1" /> + <edge from-layer="1074" from-port="2" to-layer="1095" to-port="0" /> + <edge from-layer="1075" from-port="2" to-layer="2196" to-port="0" /> + <edge from-layer="1075" from-port="2" to-layer="1136" to-port="1" /> + <edge from-layer="1076" from-port="0" to-layer="1081" to-port="0" /> + <edge from-layer="1077" from-port="0" to-layer="1080" to-port="1" /> + <edge from-layer="1078" from-port="0" to-layer="1080" to-port="2" /> + <edge from-layer="1079" from-port="0" to-layer="1080" to-port="3" /> + <edge from-layer="1080" from-port="4" to-layer="1081" to-port="1" /> + <edge from-layer="1081" from-port="2" to-layer="1082" to-port="0" /> + <edge from-layer="1082" from-port="1" to-layer="1084" to-port="0" /> + <edge from-layer="1083" from-port="0" to-layer="1084" to-port="2" /> + <edge from-layer="1084" from-port="3" to-layer="1091" to-port="0" /> + <edge from-layer="1085" from-port="0" to-layer="1088" to-port="1" /> + <edge from-layer="1086" from-port="0" to-layer="1088" to-port="2" /> + <edge from-layer="1087" from-port="0" to-layer="1088" to-port="3" /> + <edge from-layer="1088" from-port="4" to-layer="1090" to-port="0" /> + <edge from-layer="1089" from-port="0" to-layer="1090" to-port="1" /> + <edge from-layer="1090" from-port="2" to-layer="1091" to-port="1" /> + <edge from-layer="1091" from-port="2" to-layer="1136" to-port="2" /> + <edge from-layer="1091" from-port="2" to-layer="2195" to-port="0" /> + <edge from-layer="1092" from-port="0" to-layer="1114" to-port="0" /> + <edge from-layer="1093" from-port="0" to-layer="1108" to-port="0" /> + <edge from-layer="1094" from-port="0" to-layer="1108" to-port="1" /> + <edge from-layer="1094" from-port="0" to-layer="1112" to-port="1" /> + <edge from-layer="1095" from-port="1" to-layer="1098" to-port="0" /> + <edge from-layer="1096" from-port="0" to-layer="1098" to-port="1" /> + <edge from-layer="1097" from-port="0" to-layer="1098" to-port="2" /> + <edge from-layer="1098" from-port="3" to-layer="1099" to-port="1" /> + <edge from-layer="1099" from-port="2" to-layer="1111" to-port="0" /> + <edge from-layer="1099" from-port="2" to-layer="1104" to-port="0" /> + <edge from-layer="1100" from-port="1" to-layer="1129" to-port="0" /> + <edge from-layer="1100" from-port="1" to-layer="1103" to-port="0" /> + <edge from-layer="1101" from-port="0" to-layer="1103" to-port="1" /> + <edge from-layer="1102" from-port="0" to-layer="1103" to-port="2" /> + <edge from-layer="1103" from-port="3" to-layer="1104" to-port="1" /> + <edge from-layer="1104" from-port="2" to-layer="1106" to-port="0" /> + <edge from-layer="1105" from-port="0" to-layer="1106" to-port="1" /> + <edge from-layer="1106" from-port="2" to-layer="1108" to-port="2" /> + <edge from-layer="1107" from-port="0" to-layer="1108" to-port="3" /> + <edge from-layer="1107" from-port="0" to-layer="1112" to-port="3" /> + <edge from-layer="1108" from-port="4" to-layer="1114" to-port="1" /> + <edge from-layer="1109" from-port="0" to-layer="1112" to-port="0" /> + <edge from-layer="1110" from-port="0" to-layer="1111" to-port="1" /> + <edge from-layer="1111" from-port="2" to-layer="1119" to-port="2" /> + <edge from-layer="1111" from-port="2" to-layer="1112" to-port="2" /> + <edge from-layer="1112" from-port="4" to-layer="1114" to-port="2" /> + <edge from-layer="1113" from-port="0" to-layer="1114" to-port="3" /> + <edge from-layer="1114" from-port="4" to-layer="1121" to-port="0" /> + <edge from-layer="1115" from-port="0" to-layer="1121" to-port="1" /> + <edge from-layer="1116" from-port="0" to-layer="1119" to-port="0" /> + <edge from-layer="1117" from-port="0" to-layer="1119" to-port="1" /> + <edge from-layer="1118" from-port="0" to-layer="1119" to-port="3" /> + <edge from-layer="1119" from-port="4" to-layer="1121" to-port="2" /> + <edge from-layer="1120" from-port="0" to-layer="1121" to-port="3" /> + <edge from-layer="1121" from-port="4" to-layer="1124" to-port="0" /> + <edge from-layer="1122" from-port="0" to-layer="1124" to-port="1" /> + <edge from-layer="1123" from-port="0" to-layer="1124" to-port="2" /> + <edge from-layer="1124" from-port="3" to-layer="1125" to-port="0" /> + <edge from-layer="1125" from-port="2" to-layer="1135" to-port="0" /> + <edge from-layer="1125" from-port="2" to-layer="1126" to-port="0" /> + <edge from-layer="1126" from-port="1" to-layer="1134" to-port="0" /> + <edge from-layer="1127" from-port="0" to-layer="1129" to-port="1" /> + <edge from-layer="1128" from-port="0" to-layer="1129" to-port="2" /> + <edge from-layer="1129" from-port="3" to-layer="1133" to-port="0" /> + <edge from-layer="1130" from-port="0" to-layer="1133" to-port="1" /> + <edge from-layer="1131" from-port="0" to-layer="1133" to-port="2" /> + <edge from-layer="1132" from-port="0" to-layer="1133" to-port="3" /> + <edge from-layer="1133" from-port="4" to-layer="1134" to-port="1" /> + <edge from-layer="1134" from-port="2" to-layer="1135" to-port="1" /> + <edge from-layer="1135" from-port="2" to-layer="1136" to-port="3" /> + <edge from-layer="1136" from-port="4" to-layer="1138" to-port="0" /> + <edge from-layer="1137" from-port="0" to-layer="1138" to-port="1" /> + <edge from-layer="1138" from-port="2" to-layer="1140" to-port="0" /> + <edge from-layer="1139" from-port="0" to-layer="1140" to-port="1" /> + <edge from-layer="1140" from-port="2" to-layer="1149" to-port="0" /> + <edge from-layer="1141" from-port="0" to-layer="1142" to-port="0" /> + <edge from-layer="1142" from-port="1" to-layer="1145" to-port="0" /> + <edge from-layer="1143" from-port="0" to-layer="1144" to-port="0" /> + <edge from-layer="1144" from-port="1" to-layer="1145" to-port="1" /> + <edge from-layer="1145" from-port="2" to-layer="1147" to-port="0" /> + <edge from-layer="1146" from-port="0" to-layer="1147" to-port="1" /> + <edge from-layer="1147" from-port="2" to-layer="1148" to-port="0" /> + <edge from-layer="1148" from-port="1" to-layer="1149" to-port="1" /> + <edge from-layer="1149" from-port="2" to-layer="1151" to-port="0" /> + <edge from-layer="1150" from-port="0" to-layer="1151" to-port="1" /> + <edge from-layer="1151" from-port="2" to-layer="1152" to-port="0" /> + <edge from-layer="1152" from-port="2" to-layer="1182" to-port="1" /> + <edge from-layer="1152" from-port="2" to-layer="1154" to-port="0" /> + <edge from-layer="1153" from-port="0" to-layer="1154" to-port="1" /> + <edge from-layer="1154" from-port="2" to-layer="1156" to-port="0" /> + <edge from-layer="1155" from-port="0" to-layer="1156" to-port="1" /> + <edge from-layer="1156" from-port="2" to-layer="1158" to-port="0" /> + <edge from-layer="1157" from-port="0" to-layer="1158" to-port="1" /> + <edge from-layer="1158" from-port="2" to-layer="1167" to-port="0" /> + <edge from-layer="1159" from-port="0" to-layer="1160" to-port="0" /> + <edge from-layer="1160" from-port="1" to-layer="1163" to-port="0" /> + <edge from-layer="1161" from-port="0" to-layer="1162" to-port="0" /> + <edge from-layer="1162" from-port="1" to-layer="1163" to-port="1" /> + <edge from-layer="1163" from-port="2" to-layer="1165" to-port="0" /> + <edge from-layer="1164" from-port="0" to-layer="1165" to-port="1" /> + <edge from-layer="1165" from-port="2" to-layer="1166" to-port="0" /> + <edge from-layer="1166" from-port="1" to-layer="1167" to-port="1" /> + <edge from-layer="1167" from-port="2" to-layer="1169" to-port="0" /> + <edge from-layer="1168" from-port="0" to-layer="1169" to-port="1" /> + <edge from-layer="1169" from-port="2" to-layer="1170" to-port="0" /> + <edge from-layer="1170" from-port="1" to-layer="1179" to-port="0" /> + <edge from-layer="1171" from-port="0" to-layer="1172" to-port="0" /> + <edge from-layer="1172" from-port="1" to-layer="1175" to-port="0" /> + <edge from-layer="1173" from-port="0" to-layer="1174" to-port="0" /> + <edge from-layer="1174" from-port="1" to-layer="1175" to-port="1" /> + <edge from-layer="1175" from-port="2" to-layer="1177" to-port="0" /> + <edge from-layer="1176" from-port="0" to-layer="1177" to-port="1" /> + <edge from-layer="1177" from-port="2" to-layer="1178" to-port="0" /> + <edge from-layer="1178" from-port="1" to-layer="1179" to-port="1" /> + <edge from-layer="1179" from-port="2" to-layer="1181" to-port="0" /> + <edge from-layer="1180" from-port="0" to-layer="1181" to-port="1" /> + <edge from-layer="1181" from-port="2" to-layer="1182" to-port="0" /> + <edge from-layer="1182" from-port="2" to-layer="1184" to-port="0" /> + <edge from-layer="1182" from-port="2" to-layer="1379" to-port="1" /> + <edge from-layer="1183" from-port="0" to-layer="1184" to-port="1" /> + <edge from-layer="1184" from-port="2" to-layer="1186" to-port="0" /> + <edge from-layer="1185" from-port="0" to-layer="1186" to-port="1" /> + <edge from-layer="1186" from-port="2" to-layer="1188" to-port="0" /> + <edge from-layer="1187" from-port="0" to-layer="1188" to-port="1" /> + <edge from-layer="1188" from-port="2" to-layer="1197" to-port="0" /> + <edge from-layer="1189" from-port="0" to-layer="1190" to-port="0" /> + <edge from-layer="1190" from-port="1" to-layer="1193" to-port="0" /> + <edge from-layer="1191" from-port="0" to-layer="1192" to-port="0" /> + <edge from-layer="1192" from-port="1" to-layer="1193" to-port="1" /> + <edge from-layer="1193" from-port="2" to-layer="1195" to-port="0" /> + <edge from-layer="1194" from-port="0" to-layer="1195" to-port="1" /> + <edge from-layer="1195" from-port="2" to-layer="1196" to-port="0" /> + <edge from-layer="1196" from-port="1" to-layer="1197" to-port="1" /> + <edge from-layer="1197" from-port="2" to-layer="1199" to-port="0" /> + <edge from-layer="1198" from-port="0" to-layer="1199" to-port="1" /> + <edge from-layer="1199" from-port="2" to-layer="1201" to-port="0" /> + <edge from-layer="1200" from-port="0" to-layer="1201" to-port="1" /> + <edge from-layer="1201" from-port="2" to-layer="1315" to-port="0" /> + <edge from-layer="1201" from-port="2" to-layer="1217" to-port="0" /> + <edge from-layer="1201" from-port="2" to-layer="1205" to-port="0" /> + <edge from-layer="1202" from-port="0" to-layer="1205" to-port="1" /> + <edge from-layer="1203" from-port="0" to-layer="1205" to-port="2" /> + <edge from-layer="1204" from-port="0" to-layer="1205" to-port="3" /> + <edge from-layer="1205" from-port="4" to-layer="1207" to-port="0" /> + <edge from-layer="1206" from-port="0" to-layer="1207" to-port="1" /> + <edge from-layer="1207" from-port="2" to-layer="1211" to-port="0" /> + <edge from-layer="1208" from-port="0" to-layer="1211" to-port="1" /> + <edge from-layer="1209" from-port="0" to-layer="1211" to-port="2" /> + <edge from-layer="1210" from-port="0" to-layer="1211" to-port="3" /> + <edge from-layer="1211" from-port="4" to-layer="1262" to-port="0" /> + <edge from-layer="1211" from-port="4" to-layer="1257" to-port="0" /> + <edge from-layer="1211" from-port="4" to-layer="1246" to-port="0" /> + <edge from-layer="1211" from-port="4" to-layer="1243" to-port="0" /> + <edge from-layer="1212" from-port="0" to-layer="1239" to-port="0" /> + <edge from-layer="1213" from-port="0" to-layer="1239" to-port="1" /> + <edge from-layer="1214" from-port="0" to-layer="1217" to-port="1" /> + <edge from-layer="1215" from-port="0" to-layer="1217" to-port="2" /> + <edge from-layer="1216" from-port="0" to-layer="1217" to-port="3" /> + <edge from-layer="1217" from-port="4" to-layer="1274" to-port="0" /> + <edge from-layer="1217" from-port="4" to-layer="1218" to-port="0" /> + <edge from-layer="1218" from-port="1" to-layer="1221" to-port="0" /> + <edge from-layer="1219" from-port="0" to-layer="1221" to-port="1" /> + <edge from-layer="1220" from-port="0" to-layer="1221" to-port="2" /> + <edge from-layer="1221" from-port="3" to-layer="1237" to-port="0" /> + <edge from-layer="1222" from-port="0" to-layer="1227" to-port="0" /> + <edge from-layer="1223" from-port="0" to-layer="1226" to-port="1" /> + <edge from-layer="1224" from-port="0" to-layer="1226" to-port="2" /> + <edge from-layer="1225" from-port="0" to-layer="1226" to-port="3" /> + <edge from-layer="1226" from-port="4" to-layer="1227" to-port="1" /> + <edge from-layer="1227" from-port="2" to-layer="1228" to-port="0" /> + <edge from-layer="1228" from-port="1" to-layer="1230" to-port="0" /> + <edge from-layer="1229" from-port="0" to-layer="1230" to-port="2" /> + <edge from-layer="1230" from-port="3" to-layer="1231" to-port="0" /> + <edge from-layer="1230" from-port="3" to-layer="1302" to-port="0" /> + <edge from-layer="1231" from-port="1" to-layer="1234" to-port="0" /> + <edge from-layer="1232" from-port="0" to-layer="1234" to-port="1" /> + <edge from-layer="1233" from-port="0" to-layer="1234" to-port="2" /> + <edge from-layer="1234" from-port="3" to-layer="1236" to-port="0" /> + <edge from-layer="1234" from-port="3" to-layer="1326" to-port="0" /> + <edge from-layer="1235" from-port="0" to-layer="1236" to-port="1" /> + <edge from-layer="1236" from-port="2" to-layer="1237" to-port="1" /> + <edge from-layer="1237" from-port="2" to-layer="1239" to-port="2" /> + <edge from-layer="1237" from-port="2" to-layer="1267" to-port="2" /> + <edge from-layer="1238" from-port="0" to-layer="1239" to-port="3" /> + <edge from-layer="1239" from-port="4" to-layer="1241" to-port="0" /> + <edge from-layer="1240" from-port="0" to-layer="1241" to-port="2" /> + <edge from-layer="1241" from-port="3" to-layer="1242" to-port="0" /> + <edge from-layer="1242" from-port="2" to-layer="1279" to-port="1" /> + <edge from-layer="1242" from-port="2" to-layer="1243" to-port="1" /> + <edge from-layer="1243" from-port="2" to-layer="1272" to-port="0" /> + <edge from-layer="1244" from-port="0" to-layer="1254" to-port="0" /> + <edge from-layer="1245" from-port="0" to-layer="1254" to-port="1" /> + <edge from-layer="1246" from-port="1" to-layer="1248" to-port="0" /> + <edge from-layer="1247" from-port="0" to-layer="1248" to-port="2" /> + <edge from-layer="1248" from-port="3" to-layer="1249" to-port="0" /> + <edge from-layer="1249" from-port="2" to-layer="1250" to-port="0" /> + <edge from-layer="1250" from-port="1" to-layer="1252" to-port="0" /> + <edge from-layer="1251" from-port="0" to-layer="1252" to-port="1" /> + <edge from-layer="1252" from-port="2" to-layer="1254" to-port="2" /> + <edge from-layer="1253" from-port="0" to-layer="1254" to-port="3" /> + <edge from-layer="1254" from-port="4" to-layer="1257" to-port="1" /> + <edge from-layer="1254" from-port="4" to-layer="1262" to-port="2" /> + <edge from-layer="1255" from-port="0" to-layer="1257" to-port="2" /> + <edge from-layer="1256" from-port="0" to-layer="1257" to-port="3" /> + <edge from-layer="1257" from-port="4" to-layer="1259" to-port="0" /> + <edge from-layer="1258" from-port="0" to-layer="1259" to-port="1" /> + <edge from-layer="1259" from-port="2" to-layer="1263" to-port="0" /> + <edge from-layer="1260" from-port="0" to-layer="1262" to-port="1" /> + <edge from-layer="1261" from-port="0" to-layer="1262" to-port="3" /> + <edge from-layer="1262" from-port="4" to-layer="1263" to-port="1" /> + <edge from-layer="1263" from-port="2" to-layer="1271" to-port="0" /> + <edge from-layer="1264" from-port="0" to-layer="1267" to-port="0" /> + <edge from-layer="1265" from-port="0" to-layer="1267" to-port="1" /> + <edge from-layer="1266" from-port="0" to-layer="1267" to-port="3" /> + <edge from-layer="1267" from-port="4" to-layer="1269" to-port="0" /> + <edge from-layer="1268" from-port="0" to-layer="1269" to-port="2" /> + <edge from-layer="1269" from-port="3" to-layer="1270" to-port="0" /> + <edge from-layer="1270" from-port="2" to-layer="1271" to-port="1" /> + <edge from-layer="1270" from-port="2" to-layer="1300" to-port="1" /> + <edge from-layer="1271" from-port="2" to-layer="1272" to-port="1" /> + <edge from-layer="1272" from-port="2" to-layer="1327" to-port="0" /> + <edge from-layer="1272" from-port="2" to-layer="1363" to-port="0" /> + <edge from-layer="1273" from-port="0" to-layer="1274" to-port="1" /> + <edge from-layer="1274" from-port="2" to-layer="1278" to-port="0" /> + <edge from-layer="1275" from-port="0" to-layer="1278" to-port="1" /> + <edge from-layer="1276" from-port="0" to-layer="1278" to-port="2" /> + <edge from-layer="1277" from-port="0" to-layer="1278" to-port="3" /> + <edge from-layer="1278" from-port="4" to-layer="1279" to-port="0" /> + <edge from-layer="1278" from-port="4" to-layer="1282" to-port="0" /> + <edge from-layer="1278" from-port="4" to-layer="1293" to-port="0" /> + <edge from-layer="1278" from-port="4" to-layer="1298" to-port="0" /> + <edge from-layer="1279" from-port="2" to-layer="1301" to-port="0" /> + <edge from-layer="1280" from-port="0" to-layer="1290" to-port="0" /> + <edge from-layer="1281" from-port="0" to-layer="1290" to-port="1" /> + <edge from-layer="1282" from-port="1" to-layer="1284" to-port="0" /> + <edge from-layer="1283" from-port="0" to-layer="1284" to-port="2" /> + <edge from-layer="1284" from-port="3" to-layer="1285" to-port="0" /> + <edge from-layer="1285" from-port="2" to-layer="1286" to-port="0" /> + <edge from-layer="1286" from-port="1" to-layer="1288" to-port="0" /> + <edge from-layer="1287" from-port="0" to-layer="1288" to-port="1" /> + <edge from-layer="1288" from-port="2" to-layer="1290" to-port="2" /> + <edge from-layer="1289" from-port="0" to-layer="1290" to-port="3" /> + <edge from-layer="1290" from-port="4" to-layer="1298" to-port="2" /> + <edge from-layer="1290" from-port="4" to-layer="1293" to-port="1" /> + <edge from-layer="1291" from-port="0" to-layer="1293" to-port="2" /> + <edge from-layer="1292" from-port="0" to-layer="1293" to-port="3" /> + <edge from-layer="1293" from-port="4" to-layer="1295" to-port="0" /> + <edge from-layer="1294" from-port="0" to-layer="1295" to-port="1" /> + <edge from-layer="1295" from-port="2" to-layer="1299" to-port="0" /> + <edge from-layer="1296" from-port="0" to-layer="1298" to-port="1" /> + <edge from-layer="1297" from-port="0" to-layer="1298" to-port="3" /> + <edge from-layer="1298" from-port="4" to-layer="1299" to-port="1" /> + <edge from-layer="1299" from-port="2" to-layer="1300" to-port="0" /> + <edge from-layer="1300" from-port="2" to-layer="1301" to-port="1" /> + <edge from-layer="1301" from-port="2" to-layer="1302" to-port="1" /> + <edge from-layer="1301" from-port="2" to-layer="1322" to-port="0" /> + <edge from-layer="1302" from-port="2" to-layer="1363" to-port="1" /> + <edge from-layer="1302" from-port="2" to-layer="2194" to-port="0" /> + <edge from-layer="1303" from-port="0" to-layer="1308" to-port="0" /> + <edge from-layer="1304" from-port="0" to-layer="1307" to-port="1" /> + <edge from-layer="1305" from-port="0" to-layer="1307" to-port="2" /> + <edge from-layer="1306" from-port="0" to-layer="1307" to-port="3" /> + <edge from-layer="1307" from-port="4" to-layer="1308" to-port="1" /> + <edge from-layer="1308" from-port="2" to-layer="1309" to-port="0" /> + <edge from-layer="1309" from-port="1" to-layer="1311" to-port="0" /> + <edge from-layer="1310" from-port="0" to-layer="1311" to-port="2" /> + <edge from-layer="1311" from-port="3" to-layer="1318" to-port="0" /> + <edge from-layer="1312" from-port="0" to-layer="1315" to-port="1" /> + <edge from-layer="1313" from-port="0" to-layer="1315" to-port="2" /> + <edge from-layer="1314" from-port="0" to-layer="1315" to-port="3" /> + <edge from-layer="1315" from-port="4" to-layer="1317" to-port="0" /> + <edge from-layer="1316" from-port="0" to-layer="1317" to-port="1" /> + <edge from-layer="1317" from-port="2" to-layer="1318" to-port="1" /> + <edge from-layer="1318" from-port="2" to-layer="1363" to-port="2" /> + <edge from-layer="1318" from-port="2" to-layer="2193" to-port="0" /> + <edge from-layer="1319" from-port="0" to-layer="1341" to-port="0" /> + <edge from-layer="1320" from-port="0" to-layer="1335" to-port="0" /> + <edge from-layer="1321" from-port="0" to-layer="1335" to-port="1" /> + <edge from-layer="1321" from-port="0" to-layer="1339" to-port="1" /> + <edge from-layer="1322" from-port="1" to-layer="1325" to-port="0" /> + <edge from-layer="1323" from-port="0" to-layer="1325" to-port="1" /> + <edge from-layer="1324" from-port="0" to-layer="1325" to-port="2" /> + <edge from-layer="1325" from-port="3" to-layer="1326" to-port="1" /> + <edge from-layer="1326" from-port="2" to-layer="1331" to-port="0" /> + <edge from-layer="1326" from-port="2" to-layer="1338" to-port="0" /> + <edge from-layer="1327" from-port="1" to-layer="1356" to-port="0" /> + <edge from-layer="1327" from-port="1" to-layer="1330" to-port="0" /> + <edge from-layer="1328" from-port="0" to-layer="1330" to-port="1" /> + <edge from-layer="1329" from-port="0" to-layer="1330" to-port="2" /> + <edge from-layer="1330" from-port="3" to-layer="1331" to-port="1" /> + <edge from-layer="1331" from-port="2" to-layer="1333" to-port="0" /> + <edge from-layer="1332" from-port="0" to-layer="1333" to-port="1" /> + <edge from-layer="1333" from-port="2" to-layer="1335" to-port="2" /> + <edge from-layer="1334" from-port="0" to-layer="1335" to-port="3" /> + <edge from-layer="1334" from-port="0" to-layer="1339" to-port="3" /> + <edge from-layer="1335" from-port="4" to-layer="1341" to-port="1" /> + <edge from-layer="1336" from-port="0" to-layer="1339" to-port="0" /> + <edge from-layer="1337" from-port="0" to-layer="1338" to-port="1" /> + <edge from-layer="1338" from-port="2" to-layer="1339" to-port="2" /> + <edge from-layer="1338" from-port="2" to-layer="1346" to-port="2" /> + <edge from-layer="1339" from-port="4" to-layer="1341" to-port="2" /> + <edge from-layer="1340" from-port="0" to-layer="1341" to-port="3" /> + <edge from-layer="1341" from-port="4" to-layer="1348" to-port="0" /> + <edge from-layer="1342" from-port="0" to-layer="1348" to-port="1" /> + <edge from-layer="1343" from-port="0" to-layer="1346" to-port="0" /> + <edge from-layer="1344" from-port="0" to-layer="1346" to-port="1" /> + <edge from-layer="1345" from-port="0" to-layer="1346" to-port="3" /> + <edge from-layer="1346" from-port="4" to-layer="1348" to-port="2" /> + <edge from-layer="1347" from-port="0" to-layer="1348" to-port="3" /> + <edge from-layer="1348" from-port="4" to-layer="1351" to-port="0" /> + <edge from-layer="1349" from-port="0" to-layer="1351" to-port="1" /> + <edge from-layer="1350" from-port="0" to-layer="1351" to-port="2" /> + <edge from-layer="1351" from-port="3" to-layer="1352" to-port="0" /> + <edge from-layer="1352" from-port="2" to-layer="1353" to-port="0" /> + <edge from-layer="1352" from-port="2" to-layer="1362" to-port="0" /> + <edge from-layer="1353" from-port="1" to-layer="1361" to-port="0" /> + <edge from-layer="1354" from-port="0" to-layer="1356" to-port="1" /> + <edge from-layer="1355" from-port="0" to-layer="1356" to-port="2" /> + <edge from-layer="1356" from-port="3" to-layer="1360" to-port="0" /> + <edge from-layer="1357" from-port="0" to-layer="1360" to-port="1" /> + <edge from-layer="1358" from-port="0" to-layer="1360" to-port="2" /> + <edge from-layer="1359" from-port="0" to-layer="1360" to-port="3" /> + <edge from-layer="1360" from-port="4" to-layer="1361" to-port="1" /> + <edge from-layer="1361" from-port="2" to-layer="1362" to-port="1" /> + <edge from-layer="1362" from-port="2" to-layer="1363" to-port="3" /> + <edge from-layer="1363" from-port="4" to-layer="1365" to-port="0" /> + <edge from-layer="1364" from-port="0" to-layer="1365" to-port="1" /> + <edge from-layer="1365" from-port="2" to-layer="1367" to-port="0" /> + <edge from-layer="1366" from-port="0" to-layer="1367" to-port="1" /> + <edge from-layer="1367" from-port="2" to-layer="1376" to-port="0" /> + <edge from-layer="1368" from-port="0" to-layer="1369" to-port="0" /> + <edge from-layer="1369" from-port="1" to-layer="1372" to-port="0" /> + <edge from-layer="1370" from-port="0" to-layer="1371" to-port="0" /> + <edge from-layer="1371" from-port="1" to-layer="1372" to-port="1" /> + <edge from-layer="1372" from-port="2" to-layer="1374" to-port="0" /> + <edge from-layer="1373" from-port="0" to-layer="1374" to-port="1" /> + <edge from-layer="1374" from-port="2" to-layer="1375" to-port="0" /> + <edge from-layer="1375" from-port="1" to-layer="1376" to-port="1" /> + <edge from-layer="1376" from-port="2" to-layer="1378" to-port="0" /> + <edge from-layer="1377" from-port="0" to-layer="1378" to-port="1" /> + <edge from-layer="1378" from-port="2" to-layer="1379" to-port="0" /> + <edge from-layer="1379" from-port="2" to-layer="1381" to-port="0" /> + <edge from-layer="1379" from-port="2" to-layer="1409" to-port="1" /> + <edge from-layer="1380" from-port="0" to-layer="1381" to-port="1" /> + <edge from-layer="1381" from-port="2" to-layer="1383" to-port="0" /> + <edge from-layer="1382" from-port="0" to-layer="1383" to-port="1" /> + <edge from-layer="1383" from-port="2" to-layer="1385" to-port="0" /> + <edge from-layer="1384" from-port="0" to-layer="1385" to-port="1" /> + <edge from-layer="1385" from-port="2" to-layer="1394" to-port="0" /> + <edge from-layer="1386" from-port="0" to-layer="1387" to-port="0" /> + <edge from-layer="1387" from-port="1" to-layer="1390" to-port="0" /> + <edge from-layer="1388" from-port="0" to-layer="1389" to-port="0" /> + <edge from-layer="1389" from-port="1" to-layer="1390" to-port="1" /> + <edge from-layer="1390" from-port="2" to-layer="1392" to-port="0" /> + <edge from-layer="1391" from-port="0" to-layer="1392" to-port="1" /> + <edge from-layer="1392" from-port="2" to-layer="1393" to-port="0" /> + <edge from-layer="1393" from-port="1" to-layer="1394" to-port="1" /> + <edge from-layer="1394" from-port="2" to-layer="1396" to-port="0" /> + <edge from-layer="1395" from-port="0" to-layer="1396" to-port="1" /> + <edge from-layer="1396" from-port="2" to-layer="1397" to-port="0" /> + <edge from-layer="1397" from-port="1" to-layer="1406" to-port="0" /> + <edge from-layer="1398" from-port="0" to-layer="1399" to-port="0" /> + <edge from-layer="1399" from-port="1" to-layer="1402" to-port="0" /> + <edge from-layer="1400" from-port="0" to-layer="1401" to-port="0" /> + <edge from-layer="1401" from-port="1" to-layer="1402" to-port="1" /> + <edge from-layer="1402" from-port="2" to-layer="1404" to-port="0" /> + <edge from-layer="1403" from-port="0" to-layer="1404" to-port="1" /> + <edge from-layer="1404" from-port="2" to-layer="1405" to-port="0" /> + <edge from-layer="1405" from-port="1" to-layer="1406" to-port="1" /> + <edge from-layer="1406" from-port="2" to-layer="1408" to-port="0" /> + <edge from-layer="1407" from-port="0" to-layer="1408" to-port="1" /> + <edge from-layer="1408" from-port="2" to-layer="1409" to-port="0" /> + <edge from-layer="1409" from-port="2" to-layer="1411" to-port="0" /> + <edge from-layer="1409" from-port="2" to-layer="1606" to-port="1" /> + <edge from-layer="1410" from-port="0" to-layer="1411" to-port="1" /> + <edge from-layer="1411" from-port="2" to-layer="1413" to-port="0" /> + <edge from-layer="1412" from-port="0" to-layer="1413" to-port="1" /> + <edge from-layer="1413" from-port="2" to-layer="1415" to-port="0" /> + <edge from-layer="1414" from-port="0" to-layer="1415" to-port="1" /> + <edge from-layer="1415" from-port="2" to-layer="1424" to-port="0" /> + <edge from-layer="1416" from-port="0" to-layer="1417" to-port="0" /> + <edge from-layer="1417" from-port="1" to-layer="1420" to-port="0" /> + <edge from-layer="1418" from-port="0" to-layer="1419" to-port="0" /> + <edge from-layer="1419" from-port="1" to-layer="1420" to-port="1" /> + <edge from-layer="1420" from-port="2" to-layer="1422" to-port="0" /> + <edge from-layer="1421" from-port="0" to-layer="1422" to-port="1" /> + <edge from-layer="1422" from-port="2" to-layer="1423" to-port="0" /> + <edge from-layer="1423" from-port="1" to-layer="1424" to-port="1" /> + <edge from-layer="1424" from-port="2" to-layer="1426" to-port="0" /> + <edge from-layer="1425" from-port="0" to-layer="1426" to-port="1" /> + <edge from-layer="1426" from-port="2" to-layer="1428" to-port="0" /> + <edge from-layer="1427" from-port="0" to-layer="1428" to-port="1" /> + <edge from-layer="1428" from-port="2" to-layer="1444" to-port="0" /> + <edge from-layer="1428" from-port="2" to-layer="1542" to-port="0" /> + <edge from-layer="1428" from-port="2" to-layer="1432" to-port="0" /> + <edge from-layer="1429" from-port="0" to-layer="1432" to-port="1" /> + <edge from-layer="1430" from-port="0" to-layer="1432" to-port="2" /> + <edge from-layer="1431" from-port="0" to-layer="1432" to-port="3" /> + <edge from-layer="1432" from-port="4" to-layer="1434" to-port="0" /> + <edge from-layer="1433" from-port="0" to-layer="1434" to-port="1" /> + <edge from-layer="1434" from-port="2" to-layer="1438" to-port="0" /> + <edge from-layer="1435" from-port="0" to-layer="1438" to-port="1" /> + <edge from-layer="1436" from-port="0" to-layer="1438" to-port="2" /> + <edge from-layer="1437" from-port="0" to-layer="1438" to-port="3" /> + <edge from-layer="1438" from-port="4" to-layer="1484" to-port="0" /> + <edge from-layer="1438" from-port="4" to-layer="1470" to-port="0" /> + <edge from-layer="1438" from-port="4" to-layer="1473" to-port="0" /> + <edge from-layer="1438" from-port="4" to-layer="1489" to-port="0" /> + <edge from-layer="1439" from-port="0" to-layer="1466" to-port="0" /> + <edge from-layer="1440" from-port="0" to-layer="1466" to-port="1" /> + <edge from-layer="1441" from-port="0" to-layer="1444" to-port="1" /> + <edge from-layer="1442" from-port="0" to-layer="1444" to-port="2" /> + <edge from-layer="1443" from-port="0" to-layer="1444" to-port="3" /> + <edge from-layer="1444" from-port="4" to-layer="1445" to-port="0" /> + <edge from-layer="1444" from-port="4" to-layer="1501" to-port="0" /> + <edge from-layer="1445" from-port="1" to-layer="1448" to-port="0" /> + <edge from-layer="1446" from-port="0" to-layer="1448" to-port="1" /> + <edge from-layer="1447" from-port="0" to-layer="1448" to-port="2" /> + <edge from-layer="1448" from-port="3" to-layer="1464" to-port="0" /> + <edge from-layer="1449" from-port="0" to-layer="1454" to-port="0" /> + <edge from-layer="1450" from-port="0" to-layer="1453" to-port="1" /> + <edge from-layer="1451" from-port="0" to-layer="1453" to-port="2" /> + <edge from-layer="1452" from-port="0" to-layer="1453" to-port="3" /> + <edge from-layer="1453" from-port="4" to-layer="1454" to-port="1" /> + <edge from-layer="1454" from-port="2" to-layer="1455" to-port="0" /> + <edge from-layer="1455" from-port="1" to-layer="1457" to-port="0" /> + <edge from-layer="1456" from-port="0" to-layer="1457" to-port="2" /> + <edge from-layer="1457" from-port="3" to-layer="1529" to-port="0" /> + <edge from-layer="1457" from-port="3" to-layer="1458" to-port="0" /> + <edge from-layer="1458" from-port="1" to-layer="1461" to-port="0" /> + <edge from-layer="1459" from-port="0" to-layer="1461" to-port="1" /> + <edge from-layer="1460" from-port="0" to-layer="1461" to-port="2" /> + <edge from-layer="1461" from-port="3" to-layer="1553" to-port="0" /> + <edge from-layer="1461" from-port="3" to-layer="1463" to-port="0" /> + <edge from-layer="1462" from-port="0" to-layer="1463" to-port="1" /> + <edge from-layer="1463" from-port="2" to-layer="1464" to-port="1" /> + <edge from-layer="1464" from-port="2" to-layer="1466" to-port="2" /> + <edge from-layer="1464" from-port="2" to-layer="1494" to-port="2" /> + <edge from-layer="1465" from-port="0" to-layer="1466" to-port="3" /> + <edge from-layer="1466" from-port="4" to-layer="1468" to-port="0" /> + <edge from-layer="1467" from-port="0" to-layer="1468" to-port="2" /> + <edge from-layer="1468" from-port="3" to-layer="1469" to-port="0" /> + <edge from-layer="1469" from-port="2" to-layer="1506" to-port="1" /> + <edge from-layer="1469" from-port="2" to-layer="1470" to-port="1" /> + <edge from-layer="1470" from-port="2" to-layer="1499" to-port="0" /> + <edge from-layer="1471" from-port="0" to-layer="1481" to-port="0" /> + <edge from-layer="1472" from-port="0" to-layer="1481" to-port="1" /> + <edge from-layer="1473" from-port="1" to-layer="1475" to-port="0" /> + <edge from-layer="1474" from-port="0" to-layer="1475" to-port="2" /> + <edge from-layer="1475" from-port="3" to-layer="1476" to-port="0" /> + <edge from-layer="1476" from-port="2" to-layer="1477" to-port="0" /> + <edge from-layer="1477" from-port="1" to-layer="1479" to-port="0" /> + <edge from-layer="1478" from-port="0" to-layer="1479" to-port="1" /> + <edge from-layer="1479" from-port="2" to-layer="1481" to-port="2" /> + <edge from-layer="1480" from-port="0" to-layer="1481" to-port="3" /> + <edge from-layer="1481" from-port="4" to-layer="1484" to-port="1" /> + <edge from-layer="1481" from-port="4" to-layer="1489" to-port="2" /> + <edge from-layer="1482" from-port="0" to-layer="1484" to-port="2" /> + <edge from-layer="1483" from-port="0" to-layer="1484" to-port="3" /> + <edge from-layer="1484" from-port="4" to-layer="1486" to-port="0" /> + <edge from-layer="1485" from-port="0" to-layer="1486" to-port="1" /> + <edge from-layer="1486" from-port="2" to-layer="1490" to-port="0" /> + <edge from-layer="1487" from-port="0" to-layer="1489" to-port="1" /> + <edge from-layer="1488" from-port="0" to-layer="1489" to-port="3" /> + <edge from-layer="1489" from-port="4" to-layer="1490" to-port="1" /> + <edge from-layer="1490" from-port="2" to-layer="1498" to-port="0" /> + <edge from-layer="1491" from-port="0" to-layer="1494" to-port="0" /> + <edge from-layer="1492" from-port="0" to-layer="1494" to-port="1" /> + <edge from-layer="1493" from-port="0" to-layer="1494" to-port="3" /> + <edge from-layer="1494" from-port="4" to-layer="1496" to-port="0" /> + <edge from-layer="1495" from-port="0" to-layer="1496" to-port="2" /> + <edge from-layer="1496" from-port="3" to-layer="1497" to-port="0" /> + <edge from-layer="1497" from-port="2" to-layer="1498" to-port="1" /> + <edge from-layer="1497" from-port="2" to-layer="1527" to-port="1" /> + <edge from-layer="1498" from-port="2" to-layer="1499" to-port="1" /> + <edge from-layer="1499" from-port="2" to-layer="1554" to-port="0" /> + <edge from-layer="1499" from-port="2" to-layer="1590" to-port="0" /> + <edge from-layer="1500" from-port="0" to-layer="1501" to-port="1" /> + <edge from-layer="1501" from-port="2" to-layer="1505" to-port="0" /> + <edge from-layer="1502" from-port="0" to-layer="1505" to-port="1" /> + <edge from-layer="1503" from-port="0" to-layer="1505" to-port="2" /> + <edge from-layer="1504" from-port="0" to-layer="1505" to-port="3" /> + <edge from-layer="1505" from-port="4" to-layer="1520" to-port="0" /> + <edge from-layer="1505" from-port="4" to-layer="1506" to-port="0" /> + <edge from-layer="1505" from-port="4" to-layer="1509" to-port="0" /> + <edge from-layer="1505" from-port="4" to-layer="1525" to-port="0" /> + <edge from-layer="1506" from-port="2" to-layer="1528" to-port="0" /> + <edge from-layer="1507" from-port="0" to-layer="1517" to-port="0" /> + <edge from-layer="1508" from-port="0" to-layer="1517" to-port="1" /> + <edge from-layer="1509" from-port="1" to-layer="1511" to-port="0" /> + <edge from-layer="1510" from-port="0" to-layer="1511" to-port="2" /> + <edge from-layer="1511" from-port="3" to-layer="1512" to-port="0" /> + <edge from-layer="1512" from-port="2" to-layer="1513" to-port="0" /> + <edge from-layer="1513" from-port="1" to-layer="1515" to-port="0" /> + <edge from-layer="1514" from-port="0" to-layer="1515" to-port="1" /> + <edge from-layer="1515" from-port="2" to-layer="1517" to-port="2" /> + <edge from-layer="1516" from-port="0" to-layer="1517" to-port="3" /> + <edge from-layer="1517" from-port="4" to-layer="1520" to-port="1" /> + <edge from-layer="1517" from-port="4" to-layer="1525" to-port="2" /> + <edge from-layer="1518" from-port="0" to-layer="1520" to-port="2" /> + <edge from-layer="1519" from-port="0" to-layer="1520" to-port="3" /> + <edge from-layer="1520" from-port="4" to-layer="1522" to-port="0" /> + <edge from-layer="1521" from-port="0" to-layer="1522" to-port="1" /> + <edge from-layer="1522" from-port="2" to-layer="1526" to-port="0" /> + <edge from-layer="1523" from-port="0" to-layer="1525" to-port="1" /> + <edge from-layer="1524" from-port="0" to-layer="1525" to-port="3" /> + <edge from-layer="1525" from-port="4" to-layer="1526" to-port="1" /> + <edge from-layer="1526" from-port="2" to-layer="1527" to-port="0" /> + <edge from-layer="1527" from-port="2" to-layer="1528" to-port="1" /> + <edge from-layer="1528" from-port="2" to-layer="1549" to-port="0" /> + <edge from-layer="1528" from-port="2" to-layer="1529" to-port="1" /> + <edge from-layer="1529" from-port="2" to-layer="1590" to-port="1" /> + <edge from-layer="1529" from-port="2" to-layer="2192" to-port="0" /> + <edge from-layer="1530" from-port="0" to-layer="1535" to-port="0" /> + <edge from-layer="1531" from-port="0" to-layer="1534" to-port="1" /> + <edge from-layer="1532" from-port="0" to-layer="1534" to-port="2" /> + <edge from-layer="1533" from-port="0" to-layer="1534" to-port="3" /> + <edge from-layer="1534" from-port="4" to-layer="1535" to-port="1" /> + <edge from-layer="1535" from-port="2" to-layer="1536" to-port="0" /> + <edge from-layer="1536" from-port="1" to-layer="1538" to-port="0" /> + <edge from-layer="1537" from-port="0" to-layer="1538" to-port="2" /> + <edge from-layer="1538" from-port="3" to-layer="1545" to-port="0" /> + <edge from-layer="1539" from-port="0" to-layer="1542" to-port="1" /> + <edge from-layer="1540" from-port="0" to-layer="1542" to-port="2" /> + <edge from-layer="1541" from-port="0" to-layer="1542" to-port="3" /> + <edge from-layer="1542" from-port="4" to-layer="1544" to-port="0" /> + <edge from-layer="1543" from-port="0" to-layer="1544" to-port="1" /> + <edge from-layer="1544" from-port="2" to-layer="1545" to-port="1" /> + <edge from-layer="1545" from-port="2" to-layer="2191" to-port="0" /> + <edge from-layer="1545" from-port="2" to-layer="1590" to-port="2" /> + <edge from-layer="1546" from-port="0" to-layer="1568" to-port="0" /> + <edge from-layer="1547" from-port="0" to-layer="1562" to-port="0" /> + <edge from-layer="1548" from-port="0" to-layer="1562" to-port="1" /> + <edge from-layer="1548" from-port="0" to-layer="1566" to-port="1" /> + <edge from-layer="1549" from-port="1" to-layer="1552" to-port="0" /> + <edge from-layer="1550" from-port="0" to-layer="1552" to-port="1" /> + <edge from-layer="1551" from-port="0" to-layer="1552" to-port="2" /> + <edge from-layer="1552" from-port="3" to-layer="1553" to-port="1" /> + <edge from-layer="1553" from-port="2" to-layer="1565" to-port="0" /> + <edge from-layer="1553" from-port="2" to-layer="1558" to-port="0" /> + <edge from-layer="1554" from-port="1" to-layer="1557" to-port="0" /> + <edge from-layer="1554" from-port="1" to-layer="1583" to-port="0" /> + <edge from-layer="1555" from-port="0" to-layer="1557" to-port="1" /> + <edge from-layer="1556" from-port="0" to-layer="1557" to-port="2" /> + <edge from-layer="1557" from-port="3" to-layer="1558" to-port="1" /> + <edge from-layer="1558" from-port="2" to-layer="1560" to-port="0" /> + <edge from-layer="1559" from-port="0" to-layer="1560" to-port="1" /> + <edge from-layer="1560" from-port="2" to-layer="1562" to-port="2" /> + <edge from-layer="1561" from-port="0" to-layer="1566" to-port="3" /> + <edge from-layer="1561" from-port="0" to-layer="1562" to-port="3" /> + <edge from-layer="1562" from-port="4" to-layer="1568" to-port="1" /> + <edge from-layer="1563" from-port="0" to-layer="1566" to-port="0" /> + <edge from-layer="1564" from-port="0" to-layer="1565" to-port="1" /> + <edge from-layer="1565" from-port="2" to-layer="1573" to-port="2" /> + <edge from-layer="1565" from-port="2" to-layer="1566" to-port="2" /> + <edge from-layer="1566" from-port="4" to-layer="1568" to-port="2" /> + <edge from-layer="1567" from-port="0" to-layer="1568" to-port="3" /> + <edge from-layer="1568" from-port="4" to-layer="1575" to-port="0" /> + <edge from-layer="1569" from-port="0" to-layer="1575" to-port="1" /> + <edge from-layer="1570" from-port="0" to-layer="1573" to-port="0" /> + <edge from-layer="1571" from-port="0" to-layer="1573" to-port="1" /> + <edge from-layer="1572" from-port="0" to-layer="1573" to-port="3" /> + <edge from-layer="1573" from-port="4" to-layer="1575" to-port="2" /> + <edge from-layer="1574" from-port="0" to-layer="1575" to-port="3" /> + <edge from-layer="1575" from-port="4" to-layer="1578" to-port="0" /> + <edge from-layer="1576" from-port="0" to-layer="1578" to-port="1" /> + <edge from-layer="1577" from-port="0" to-layer="1578" to-port="2" /> + <edge from-layer="1578" from-port="3" to-layer="1579" to-port="0" /> + <edge from-layer="1579" from-port="2" to-layer="1589" to-port="0" /> + <edge from-layer="1579" from-port="2" to-layer="1580" to-port="0" /> + <edge from-layer="1580" from-port="1" to-layer="1588" to-port="0" /> + <edge from-layer="1581" from-port="0" to-layer="1583" to-port="1" /> + <edge from-layer="1582" from-port="0" to-layer="1583" to-port="2" /> + <edge from-layer="1583" from-port="3" to-layer="1587" to-port="0" /> + <edge from-layer="1584" from-port="0" to-layer="1587" to-port="1" /> + <edge from-layer="1585" from-port="0" to-layer="1587" to-port="2" /> + <edge from-layer="1586" from-port="0" to-layer="1587" to-port="3" /> + <edge from-layer="1587" from-port="4" to-layer="1588" to-port="1" /> + <edge from-layer="1588" from-port="2" to-layer="1589" to-port="1" /> + <edge from-layer="1589" from-port="2" to-layer="1590" to-port="3" /> + <edge from-layer="1590" from-port="4" to-layer="1592" to-port="0" /> + <edge from-layer="1591" from-port="0" to-layer="1592" to-port="1" /> + <edge from-layer="1592" from-port="2" to-layer="1594" to-port="0" /> + <edge from-layer="1593" from-port="0" to-layer="1594" to-port="1" /> + <edge from-layer="1594" from-port="2" to-layer="1603" to-port="0" /> + <edge from-layer="1595" from-port="0" to-layer="1596" to-port="0" /> + <edge from-layer="1596" from-port="1" to-layer="1599" to-port="0" /> + <edge from-layer="1597" from-port="0" to-layer="1598" to-port="0" /> + <edge from-layer="1598" from-port="1" to-layer="1599" to-port="1" /> + <edge from-layer="1599" from-port="2" to-layer="1601" to-port="0" /> + <edge from-layer="1600" from-port="0" to-layer="1601" to-port="1" /> + <edge from-layer="1601" from-port="2" to-layer="1602" to-port="0" /> + <edge from-layer="1602" from-port="1" to-layer="1603" to-port="1" /> + <edge from-layer="1603" from-port="2" to-layer="1605" to-port="0" /> + <edge from-layer="1604" from-port="0" to-layer="1605" to-port="1" /> + <edge from-layer="1605" from-port="2" to-layer="1606" to-port="0" /> + <edge from-layer="1606" from-port="2" to-layer="1608" to-port="0" /> + <edge from-layer="1606" from-port="2" to-layer="1636" to-port="1" /> + <edge from-layer="1607" from-port="0" to-layer="1608" to-port="1" /> + <edge from-layer="1608" from-port="2" to-layer="1610" to-port="0" /> + <edge from-layer="1609" from-port="0" to-layer="1610" to-port="1" /> + <edge from-layer="1610" from-port="2" to-layer="1612" to-port="0" /> + <edge from-layer="1611" from-port="0" to-layer="1612" to-port="1" /> + <edge from-layer="1612" from-port="2" to-layer="1621" to-port="0" /> + <edge from-layer="1613" from-port="0" to-layer="1614" to-port="0" /> + <edge from-layer="1614" from-port="1" to-layer="1617" to-port="0" /> + <edge from-layer="1615" from-port="0" to-layer="1616" to-port="0" /> + <edge from-layer="1616" from-port="1" to-layer="1617" to-port="1" /> + <edge from-layer="1617" from-port="2" to-layer="1619" to-port="0" /> + <edge from-layer="1618" from-port="0" to-layer="1619" to-port="1" /> + <edge from-layer="1619" from-port="2" to-layer="1620" to-port="0" /> + <edge from-layer="1620" from-port="1" to-layer="1621" to-port="1" /> + <edge from-layer="1621" from-port="2" to-layer="1623" to-port="0" /> + <edge from-layer="1622" from-port="0" to-layer="1623" to-port="1" /> + <edge from-layer="1623" from-port="2" to-layer="1624" to-port="0" /> + <edge from-layer="1624" from-port="1" to-layer="1633" to-port="0" /> + <edge from-layer="1625" from-port="0" to-layer="1626" to-port="0" /> + <edge from-layer="1626" from-port="1" to-layer="1629" to-port="0" /> + <edge from-layer="1627" from-port="0" to-layer="1628" to-port="0" /> + <edge from-layer="1628" from-port="1" to-layer="1629" to-port="1" /> + <edge from-layer="1629" from-port="2" to-layer="1631" to-port="0" /> + <edge from-layer="1630" from-port="0" to-layer="1631" to-port="1" /> + <edge from-layer="1631" from-port="2" to-layer="1632" to-port="0" /> + <edge from-layer="1632" from-port="1" to-layer="1633" to-port="1" /> + <edge from-layer="1633" from-port="2" to-layer="1635" to-port="0" /> + <edge from-layer="1634" from-port="0" to-layer="1635" to-port="1" /> + <edge from-layer="1635" from-port="2" to-layer="1636" to-port="0" /> + <edge from-layer="1636" from-port="2" to-layer="1638" to-port="0" /> + <edge from-layer="1636" from-port="2" to-layer="1833" to-port="1" /> + <edge from-layer="1637" from-port="0" to-layer="1638" to-port="1" /> + <edge from-layer="1638" from-port="2" to-layer="1640" to-port="0" /> + <edge from-layer="1639" from-port="0" to-layer="1640" to-port="1" /> + <edge from-layer="1640" from-port="2" to-layer="1642" to-port="0" /> + <edge from-layer="1641" from-port="0" to-layer="1642" to-port="1" /> + <edge from-layer="1642" from-port="2" to-layer="1651" to-port="0" /> + <edge from-layer="1643" from-port="0" to-layer="1644" to-port="0" /> + <edge from-layer="1644" from-port="1" to-layer="1647" to-port="0" /> + <edge from-layer="1645" from-port="0" to-layer="1646" to-port="0" /> + <edge from-layer="1646" from-port="1" to-layer="1647" to-port="1" /> + <edge from-layer="1647" from-port="2" to-layer="1649" to-port="0" /> + <edge from-layer="1648" from-port="0" to-layer="1649" to-port="1" /> + <edge from-layer="1649" from-port="2" to-layer="1650" to-port="0" /> + <edge from-layer="1650" from-port="1" to-layer="1651" to-port="1" /> + <edge from-layer="1651" from-port="2" to-layer="1653" to-port="0" /> + <edge from-layer="1652" from-port="0" to-layer="1653" to-port="1" /> + <edge from-layer="1653" from-port="2" to-layer="1655" to-port="0" /> + <edge from-layer="1654" from-port="0" to-layer="1655" to-port="1" /> + <edge from-layer="1655" from-port="2" to-layer="1659" to-port="0" /> + <edge from-layer="1655" from-port="2" to-layer="1769" to-port="0" /> + <edge from-layer="1655" from-port="2" to-layer="1671" to-port="0" /> + <edge from-layer="1656" from-port="0" to-layer="1659" to-port="1" /> + <edge from-layer="1657" from-port="0" to-layer="1659" to-port="2" /> + <edge from-layer="1658" from-port="0" to-layer="1659" to-port="3" /> + <edge from-layer="1659" from-port="4" to-layer="1661" to-port="0" /> + <edge from-layer="1660" from-port="0" to-layer="1661" to-port="1" /> + <edge from-layer="1661" from-port="2" to-layer="1665" to-port="0" /> + <edge from-layer="1662" from-port="0" to-layer="1665" to-port="1" /> + <edge from-layer="1663" from-port="0" to-layer="1665" to-port="2" /> + <edge from-layer="1664" from-port="0" to-layer="1665" to-port="3" /> + <edge from-layer="1665" from-port="4" to-layer="1716" to-port="0" /> + <edge from-layer="1665" from-port="4" to-layer="1700" to-port="0" /> + <edge from-layer="1665" from-port="4" to-layer="1697" to-port="0" /> + <edge from-layer="1665" from-port="4" to-layer="1711" to-port="0" /> + <edge from-layer="1666" from-port="0" to-layer="1693" to-port="0" /> + <edge from-layer="1667" from-port="0" to-layer="1693" to-port="1" /> + <edge from-layer="1668" from-port="0" to-layer="1671" to-port="1" /> + <edge from-layer="1669" from-port="0" to-layer="1671" to-port="2" /> + <edge from-layer="1670" from-port="0" to-layer="1671" to-port="3" /> + <edge from-layer="1671" from-port="4" to-layer="1672" to-port="0" /> + <edge from-layer="1671" from-port="4" to-layer="1728" to-port="0" /> + <edge from-layer="1672" from-port="1" to-layer="1675" to-port="0" /> + <edge from-layer="1673" from-port="0" to-layer="1675" to-port="1" /> + <edge from-layer="1674" from-port="0" to-layer="1675" to-port="2" /> + <edge from-layer="1675" from-port="3" to-layer="1691" to-port="0" /> + <edge from-layer="1676" from-port="0" to-layer="1681" to-port="0" /> + <edge from-layer="1677" from-port="0" to-layer="1680" to-port="1" /> + <edge from-layer="1678" from-port="0" to-layer="1680" to-port="2" /> + <edge from-layer="1679" from-port="0" to-layer="1680" to-port="3" /> + <edge from-layer="1680" from-port="4" to-layer="1681" to-port="1" /> + <edge from-layer="1681" from-port="2" to-layer="1682" to-port="0" /> + <edge from-layer="1682" from-port="1" to-layer="1684" to-port="0" /> + <edge from-layer="1683" from-port="0" to-layer="1684" to-port="2" /> + <edge from-layer="1684" from-port="3" to-layer="1756" to-port="0" /> + <edge from-layer="1684" from-port="3" to-layer="1685" to-port="0" /> + <edge from-layer="1685" from-port="1" to-layer="1688" to-port="0" /> + <edge from-layer="1686" from-port="0" to-layer="1688" to-port="1" /> + <edge from-layer="1687" from-port="0" to-layer="1688" to-port="2" /> + <edge from-layer="1688" from-port="3" to-layer="1780" to-port="0" /> + <edge from-layer="1688" from-port="3" to-layer="1690" to-port="0" /> + <edge from-layer="1689" from-port="0" to-layer="1690" to-port="1" /> + <edge from-layer="1690" from-port="2" to-layer="1691" to-port="1" /> + <edge from-layer="1691" from-port="2" to-layer="1693" to-port="2" /> + <edge from-layer="1691" from-port="2" to-layer="1721" to-port="2" /> + <edge from-layer="1692" from-port="0" to-layer="1693" to-port="3" /> + <edge from-layer="1693" from-port="4" to-layer="1695" to-port="0" /> + <edge from-layer="1694" from-port="0" to-layer="1695" to-port="2" /> + <edge from-layer="1695" from-port="3" to-layer="1696" to-port="0" /> + <edge from-layer="1696" from-port="2" to-layer="1733" to-port="1" /> + <edge from-layer="1696" from-port="2" to-layer="1697" to-port="1" /> + <edge from-layer="1697" from-port="2" to-layer="1726" to-port="0" /> + <edge from-layer="1698" from-port="0" to-layer="1708" to-port="0" /> + <edge from-layer="1699" from-port="0" to-layer="1708" to-port="1" /> + <edge from-layer="1700" from-port="1" to-layer="1702" to-port="0" /> + <edge from-layer="1701" from-port="0" to-layer="1702" to-port="2" /> + <edge from-layer="1702" from-port="3" to-layer="1703" to-port="0" /> + <edge from-layer="1703" from-port="2" to-layer="1704" to-port="0" /> + <edge from-layer="1704" from-port="1" to-layer="1706" to-port="0" /> + <edge from-layer="1705" from-port="0" to-layer="1706" to-port="1" /> + <edge from-layer="1706" from-port="2" to-layer="1708" to-port="2" /> + <edge from-layer="1707" from-port="0" to-layer="1708" to-port="3" /> + <edge from-layer="1708" from-port="4" to-layer="1716" to-port="2" /> + <edge from-layer="1708" from-port="4" to-layer="1711" to-port="1" /> + <edge from-layer="1709" from-port="0" to-layer="1711" to-port="2" /> + <edge from-layer="1710" from-port="0" to-layer="1711" to-port="3" /> + <edge from-layer="1711" from-port="4" to-layer="1713" to-port="0" /> + <edge from-layer="1712" from-port="0" to-layer="1713" to-port="1" /> + <edge from-layer="1713" from-port="2" to-layer="1717" to-port="0" /> + <edge from-layer="1714" from-port="0" to-layer="1716" to-port="1" /> + <edge from-layer="1715" from-port="0" to-layer="1716" to-port="3" /> + <edge from-layer="1716" from-port="4" to-layer="1717" to-port="1" /> + <edge from-layer="1717" from-port="2" to-layer="1725" to-port="0" /> + <edge from-layer="1718" from-port="0" to-layer="1721" to-port="0" /> + <edge from-layer="1719" from-port="0" to-layer="1721" to-port="1" /> + <edge from-layer="1720" from-port="0" to-layer="1721" to-port="3" /> + <edge from-layer="1721" from-port="4" to-layer="1723" to-port="0" /> + <edge from-layer="1722" from-port="0" to-layer="1723" to-port="2" /> + <edge from-layer="1723" from-port="3" to-layer="1724" to-port="0" /> + <edge from-layer="1724" from-port="2" to-layer="1725" to-port="1" /> + <edge from-layer="1724" from-port="2" to-layer="1754" to-port="1" /> + <edge from-layer="1725" from-port="2" to-layer="1726" to-port="1" /> + <edge from-layer="1726" from-port="2" to-layer="1817" to-port="0" /> + <edge from-layer="1726" from-port="2" to-layer="1781" to-port="0" /> + <edge from-layer="1727" from-port="0" to-layer="1728" to-port="1" /> + <edge from-layer="1728" from-port="2" to-layer="1732" to-port="0" /> + <edge from-layer="1729" from-port="0" to-layer="1732" to-port="1" /> + <edge from-layer="1730" from-port="0" to-layer="1732" to-port="2" /> + <edge from-layer="1731" from-port="0" to-layer="1732" to-port="3" /> + <edge from-layer="1732" from-port="4" to-layer="1733" to-port="0" /> + <edge from-layer="1732" from-port="4" to-layer="1736" to-port="0" /> + <edge from-layer="1732" from-port="4" to-layer="1752" to-port="0" /> + <edge from-layer="1732" from-port="4" to-layer="1747" to-port="0" /> + <edge from-layer="1733" from-port="2" to-layer="1755" to-port="0" /> + <edge from-layer="1734" from-port="0" to-layer="1744" to-port="0" /> + <edge from-layer="1735" from-port="0" to-layer="1744" to-port="1" /> + <edge from-layer="1736" from-port="1" to-layer="1738" to-port="0" /> + <edge from-layer="1737" from-port="0" to-layer="1738" to-port="2" /> + <edge from-layer="1738" from-port="3" to-layer="1739" to-port="0" /> + <edge from-layer="1739" from-port="2" to-layer="1740" to-port="0" /> + <edge from-layer="1740" from-port="1" to-layer="1742" to-port="0" /> + <edge from-layer="1741" from-port="0" to-layer="1742" to-port="1" /> + <edge from-layer="1742" from-port="2" to-layer="1744" to-port="2" /> + <edge from-layer="1743" from-port="0" to-layer="1744" to-port="3" /> + <edge from-layer="1744" from-port="4" to-layer="1747" to-port="1" /> + <edge from-layer="1744" from-port="4" to-layer="1752" to-port="2" /> + <edge from-layer="1745" from-port="0" to-layer="1747" to-port="2" /> + <edge from-layer="1746" from-port="0" to-layer="1747" to-port="3" /> + <edge from-layer="1747" from-port="4" to-layer="1749" to-port="0" /> + <edge from-layer="1748" from-port="0" to-layer="1749" to-port="1" /> + <edge from-layer="1749" from-port="2" to-layer="1753" to-port="0" /> + <edge from-layer="1750" from-port="0" to-layer="1752" to-port="1" /> + <edge from-layer="1751" from-port="0" to-layer="1752" to-port="3" /> + <edge from-layer="1752" from-port="4" to-layer="1753" to-port="1" /> + <edge from-layer="1753" from-port="2" to-layer="1754" to-port="0" /> + <edge from-layer="1754" from-port="2" to-layer="1755" to-port="1" /> + <edge from-layer="1755" from-port="2" to-layer="1756" to-port="1" /> + <edge from-layer="1755" from-port="2" to-layer="1776" to-port="0" /> + <edge from-layer="1756" from-port="2" to-layer="2190" to-port="0" /> + <edge from-layer="1756" from-port="2" to-layer="1817" to-port="1" /> + <edge from-layer="1757" from-port="0" to-layer="1762" to-port="0" /> + <edge from-layer="1758" from-port="0" to-layer="1761" to-port="1" /> + <edge from-layer="1759" from-port="0" to-layer="1761" to-port="2" /> + <edge from-layer="1760" from-port="0" to-layer="1761" to-port="3" /> + <edge from-layer="1761" from-port="4" to-layer="1762" to-port="1" /> + <edge from-layer="1762" from-port="2" to-layer="1763" to-port="0" /> + <edge from-layer="1763" from-port="1" to-layer="1765" to-port="0" /> + <edge from-layer="1764" from-port="0" to-layer="1765" to-port="2" /> + <edge from-layer="1765" from-port="3" to-layer="1772" to-port="0" /> + <edge from-layer="1766" from-port="0" to-layer="1769" to-port="1" /> + <edge from-layer="1767" from-port="0" to-layer="1769" to-port="2" /> + <edge from-layer="1768" from-port="0" to-layer="1769" to-port="3" /> + <edge from-layer="1769" from-port="4" to-layer="1771" to-port="0" /> + <edge from-layer="1770" from-port="0" to-layer="1771" to-port="1" /> + <edge from-layer="1771" from-port="2" to-layer="1772" to-port="1" /> + <edge from-layer="1772" from-port="2" to-layer="1817" to-port="2" /> + <edge from-layer="1772" from-port="2" to-layer="2189" to-port="0" /> + <edge from-layer="1773" from-port="0" to-layer="1795" to-port="0" /> + <edge from-layer="1774" from-port="0" to-layer="1789" to-port="0" /> + <edge from-layer="1775" from-port="0" to-layer="1793" to-port="1" /> + <edge from-layer="1775" from-port="0" to-layer="1789" to-port="1" /> + <edge from-layer="1776" from-port="1" to-layer="1779" to-port="0" /> + <edge from-layer="1777" from-port="0" to-layer="1779" to-port="1" /> + <edge from-layer="1778" from-port="0" to-layer="1779" to-port="2" /> + <edge from-layer="1779" from-port="3" to-layer="1780" to-port="1" /> + <edge from-layer="1780" from-port="2" to-layer="1785" to-port="0" /> + <edge from-layer="1780" from-port="2" to-layer="1792" to-port="0" /> + <edge from-layer="1781" from-port="1" to-layer="1784" to-port="0" /> + <edge from-layer="1781" from-port="1" to-layer="1810" to-port="0" /> + <edge from-layer="1782" from-port="0" to-layer="1784" to-port="1" /> + <edge from-layer="1783" from-port="0" to-layer="1784" to-port="2" /> + <edge from-layer="1784" from-port="3" to-layer="1785" to-port="1" /> + <edge from-layer="1785" from-port="2" to-layer="1787" to-port="0" /> + <edge from-layer="1786" from-port="0" to-layer="1787" to-port="1" /> + <edge from-layer="1787" from-port="2" to-layer="1789" to-port="2" /> + <edge from-layer="1788" from-port="0" to-layer="1793" to-port="3" /> + <edge from-layer="1788" from-port="0" to-layer="1789" to-port="3" /> + <edge from-layer="1789" from-port="4" to-layer="1795" to-port="1" /> + <edge from-layer="1790" from-port="0" to-layer="1793" to-port="0" /> + <edge from-layer="1791" from-port="0" to-layer="1792" to-port="1" /> + <edge from-layer="1792" from-port="2" to-layer="1793" to-port="2" /> + <edge from-layer="1792" from-port="2" to-layer="1800" to-port="2" /> + <edge from-layer="1793" from-port="4" to-layer="1795" to-port="2" /> + <edge from-layer="1794" from-port="0" to-layer="1795" to-port="3" /> + <edge from-layer="1795" from-port="4" to-layer="1802" to-port="0" /> + <edge from-layer="1796" from-port="0" to-layer="1802" to-port="1" /> + <edge from-layer="1797" from-port="0" to-layer="1800" to-port="0" /> + <edge from-layer="1798" from-port="0" to-layer="1800" to-port="1" /> + <edge from-layer="1799" from-port="0" to-layer="1800" to-port="3" /> + <edge from-layer="1800" from-port="4" to-layer="1802" to-port="2" /> + <edge from-layer="1801" from-port="0" to-layer="1802" to-port="3" /> + <edge from-layer="1802" from-port="4" to-layer="1805" to-port="0" /> + <edge from-layer="1803" from-port="0" to-layer="1805" to-port="1" /> + <edge from-layer="1804" from-port="0" to-layer="1805" to-port="2" /> + <edge from-layer="1805" from-port="3" to-layer="1806" to-port="0" /> + <edge from-layer="1806" from-port="2" to-layer="1816" to-port="0" /> + <edge from-layer="1806" from-port="2" to-layer="1807" to-port="0" /> + <edge from-layer="1807" from-port="1" to-layer="1815" to-port="0" /> + <edge from-layer="1808" from-port="0" to-layer="1810" to-port="1" /> + <edge from-layer="1809" from-port="0" to-layer="1810" to-port="2" /> + <edge from-layer="1810" from-port="3" to-layer="1814" to-port="0" /> + <edge from-layer="1811" from-port="0" to-layer="1814" to-port="1" /> + <edge from-layer="1812" from-port="0" to-layer="1814" to-port="2" /> + <edge from-layer="1813" from-port="0" to-layer="1814" to-port="3" /> + <edge from-layer="1814" from-port="4" to-layer="1815" to-port="1" /> + <edge from-layer="1815" from-port="2" to-layer="1816" to-port="1" /> + <edge from-layer="1816" from-port="2" to-layer="1817" to-port="3" /> + <edge from-layer="1817" from-port="4" to-layer="1819" to-port="0" /> + <edge from-layer="1818" from-port="0" to-layer="1819" to-port="1" /> + <edge from-layer="1819" from-port="2" to-layer="1821" to-port="0" /> + <edge from-layer="1820" from-port="0" to-layer="1821" to-port="1" /> + <edge from-layer="1821" from-port="2" to-layer="1830" to-port="0" /> + <edge from-layer="1822" from-port="0" to-layer="1823" to-port="0" /> + <edge from-layer="1823" from-port="1" to-layer="1826" to-port="0" /> + <edge from-layer="1824" from-port="0" to-layer="1825" to-port="0" /> + <edge from-layer="1825" from-port="1" to-layer="1826" to-port="1" /> + <edge from-layer="1826" from-port="2" to-layer="1828" to-port="0" /> + <edge from-layer="1827" from-port="0" to-layer="1828" to-port="1" /> + <edge from-layer="1828" from-port="2" to-layer="1829" to-port="0" /> + <edge from-layer="1829" from-port="1" to-layer="1830" to-port="1" /> + <edge from-layer="1830" from-port="2" to-layer="1832" to-port="0" /> + <edge from-layer="1831" from-port="0" to-layer="1832" to-port="1" /> + <edge from-layer="1832" from-port="2" to-layer="1833" to-port="0" /> + <edge from-layer="1833" from-port="2" to-layer="1835" to-port="0" /> + <edge from-layer="1833" from-port="2" to-layer="1863" to-port="1" /> + <edge from-layer="1834" from-port="0" to-layer="1835" to-port="1" /> + <edge from-layer="1835" from-port="2" to-layer="1837" to-port="0" /> + <edge from-layer="1836" from-port="0" to-layer="1837" to-port="1" /> + <edge from-layer="1837" from-port="2" to-layer="1839" to-port="0" /> + <edge from-layer="1838" from-port="0" to-layer="1839" to-port="1" /> + <edge from-layer="1839" from-port="2" to-layer="1848" to-port="0" /> + <edge from-layer="1840" from-port="0" to-layer="1841" to-port="0" /> + <edge from-layer="1841" from-port="1" to-layer="1844" to-port="0" /> + <edge from-layer="1842" from-port="0" to-layer="1843" to-port="0" /> + <edge from-layer="1843" from-port="1" to-layer="1844" to-port="1" /> + <edge from-layer="1844" from-port="2" to-layer="1846" to-port="0" /> + <edge from-layer="1845" from-port="0" to-layer="1846" to-port="1" /> + <edge from-layer="1846" from-port="2" to-layer="1847" to-port="0" /> + <edge from-layer="1847" from-port="1" to-layer="1848" to-port="1" /> + <edge from-layer="1848" from-port="2" to-layer="1850" to-port="0" /> + <edge from-layer="1849" from-port="0" to-layer="1850" to-port="1" /> + <edge from-layer="1850" from-port="2" to-layer="1851" to-port="0" /> + <edge from-layer="1851" from-port="1" to-layer="1860" to-port="0" /> + <edge from-layer="1852" from-port="0" to-layer="1853" to-port="0" /> + <edge from-layer="1853" from-port="1" to-layer="1856" to-port="0" /> + <edge from-layer="1854" from-port="0" to-layer="1855" to-port="0" /> + <edge from-layer="1855" from-port="1" to-layer="1856" to-port="1" /> + <edge from-layer="1856" from-port="2" to-layer="1858" to-port="0" /> + <edge from-layer="1857" from-port="0" to-layer="1858" to-port="1" /> + <edge from-layer="1858" from-port="2" to-layer="1859" to-port="0" /> + <edge from-layer="1859" from-port="1" to-layer="1860" to-port="1" /> + <edge from-layer="1860" from-port="2" to-layer="1862" to-port="0" /> + <edge from-layer="1861" from-port="0" to-layer="1862" to-port="1" /> + <edge from-layer="1862" from-port="2" to-layer="1863" to-port="0" /> + <edge from-layer="1863" from-port="2" to-layer="1865" to-port="0" /> + <edge from-layer="1863" from-port="2" to-layer="2060" to-port="1" /> + <edge from-layer="1864" from-port="0" to-layer="1865" to-port="1" /> + <edge from-layer="1865" from-port="2" to-layer="1867" to-port="0" /> + <edge from-layer="1866" from-port="0" to-layer="1867" to-port="1" /> + <edge from-layer="1867" from-port="2" to-layer="1869" to-port="0" /> + <edge from-layer="1868" from-port="0" to-layer="1869" to-port="1" /> + <edge from-layer="1869" from-port="2" to-layer="1878" to-port="0" /> + <edge from-layer="1870" from-port="0" to-layer="1871" to-port="0" /> + <edge from-layer="1871" from-port="1" to-layer="1874" to-port="0" /> + <edge from-layer="1872" from-port="0" to-layer="1873" to-port="0" /> + <edge from-layer="1873" from-port="1" to-layer="1874" to-port="1" /> + <edge from-layer="1874" from-port="2" to-layer="1876" to-port="0" /> + <edge from-layer="1875" from-port="0" to-layer="1876" to-port="1" /> + <edge from-layer="1876" from-port="2" to-layer="1877" to-port="0" /> + <edge from-layer="1877" from-port="1" to-layer="1878" to-port="1" /> + <edge from-layer="1878" from-port="2" to-layer="1880" to-port="0" /> + <edge from-layer="1879" from-port="0" to-layer="1880" to-port="1" /> + <edge from-layer="1880" from-port="2" to-layer="1882" to-port="0" /> + <edge from-layer="1881" from-port="0" to-layer="1882" to-port="1" /> + <edge from-layer="1882" from-port="2" to-layer="1886" to-port="0" /> + <edge from-layer="1882" from-port="2" to-layer="1898" to-port="0" /> + <edge from-layer="1882" from-port="2" to-layer="1996" to-port="0" /> + <edge from-layer="1883" from-port="0" to-layer="1886" to-port="1" /> + <edge from-layer="1884" from-port="0" to-layer="1886" to-port="2" /> + <edge from-layer="1885" from-port="0" to-layer="1886" to-port="3" /> + <edge from-layer="1886" from-port="4" to-layer="1888" to-port="0" /> + <edge from-layer="1887" from-port="0" to-layer="1888" to-port="1" /> + <edge from-layer="1888" from-port="2" to-layer="1892" to-port="0" /> + <edge from-layer="1889" from-port="0" to-layer="1892" to-port="1" /> + <edge from-layer="1890" from-port="0" to-layer="1892" to-port="2" /> + <edge from-layer="1891" from-port="0" to-layer="1892" to-port="3" /> + <edge from-layer="1892" from-port="4" to-layer="1938" to-port="0" /> + <edge from-layer="1892" from-port="4" to-layer="1943" to-port="0" /> + <edge from-layer="1892" from-port="4" to-layer="1924" to-port="0" /> + <edge from-layer="1892" from-port="4" to-layer="1927" to-port="0" /> + <edge from-layer="1893" from-port="0" to-layer="1920" to-port="0" /> + <edge from-layer="1894" from-port="0" to-layer="1920" to-port="1" /> + <edge from-layer="1895" from-port="0" to-layer="1898" to-port="1" /> + <edge from-layer="1896" from-port="0" to-layer="1898" to-port="2" /> + <edge from-layer="1897" from-port="0" to-layer="1898" to-port="3" /> + <edge from-layer="1898" from-port="4" to-layer="1955" to-port="0" /> + <edge from-layer="1898" from-port="4" to-layer="1899" to-port="0" /> + <edge from-layer="1899" from-port="1" to-layer="1902" to-port="0" /> + <edge from-layer="1900" from-port="0" to-layer="1902" to-port="1" /> + <edge from-layer="1901" from-port="0" to-layer="1902" to-port="2" /> + <edge from-layer="1902" from-port="3" to-layer="1918" to-port="0" /> + <edge from-layer="1903" from-port="0" to-layer="1908" to-port="0" /> + <edge from-layer="1904" from-port="0" to-layer="1907" to-port="1" /> + <edge from-layer="1905" from-port="0" to-layer="1907" to-port="2" /> + <edge from-layer="1906" from-port="0" to-layer="1907" to-port="3" /> + <edge from-layer="1907" from-port="4" to-layer="1908" to-port="1" /> + <edge from-layer="1908" from-port="2" to-layer="1909" to-port="0" /> + <edge from-layer="1909" from-port="1" to-layer="1911" to-port="0" /> + <edge from-layer="1910" from-port="0" to-layer="1911" to-port="2" /> + <edge from-layer="1911" from-port="3" to-layer="1983" to-port="0" /> + <edge from-layer="1911" from-port="3" to-layer="1912" to-port="0" /> + <edge from-layer="1912" from-port="1" to-layer="1915" to-port="0" /> + <edge from-layer="1913" from-port="0" to-layer="1915" to-port="1" /> + <edge from-layer="1914" from-port="0" to-layer="1915" to-port="2" /> + <edge from-layer="1915" from-port="3" to-layer="2007" to-port="0" /> + <edge from-layer="1915" from-port="3" to-layer="1917" to-port="0" /> + <edge from-layer="1916" from-port="0" to-layer="1917" to-port="1" /> + <edge from-layer="1917" from-port="2" to-layer="1918" to-port="1" /> + <edge from-layer="1918" from-port="2" to-layer="1948" to-port="2" /> + <edge from-layer="1918" from-port="2" to-layer="1920" to-port="2" /> + <edge from-layer="1919" from-port="0" to-layer="1920" to-port="3" /> + <edge from-layer="1920" from-port="4" to-layer="1922" to-port="0" /> + <edge from-layer="1921" from-port="0" to-layer="1922" to-port="2" /> + <edge from-layer="1922" from-port="3" to-layer="1923" to-port="0" /> + <edge from-layer="1923" from-port="2" to-layer="1960" to-port="1" /> + <edge from-layer="1923" from-port="2" to-layer="1924" to-port="1" /> + <edge from-layer="1924" from-port="2" to-layer="1953" to-port="0" /> + <edge from-layer="1925" from-port="0" to-layer="1935" to-port="0" /> + <edge from-layer="1926" from-port="0" to-layer="1935" to-port="1" /> + <edge from-layer="1927" from-port="1" to-layer="1929" to-port="0" /> + <edge from-layer="1928" from-port="0" to-layer="1929" to-port="2" /> + <edge from-layer="1929" from-port="3" to-layer="1930" to-port="0" /> + <edge from-layer="1930" from-port="2" to-layer="1931" to-port="0" /> + <edge from-layer="1931" from-port="1" to-layer="1933" to-port="0" /> + <edge from-layer="1932" from-port="0" to-layer="1933" to-port="1" /> + <edge from-layer="1933" from-port="2" to-layer="1935" to-port="2" /> + <edge from-layer="1934" from-port="0" to-layer="1935" to-port="3" /> + <edge from-layer="1935" from-port="4" to-layer="1938" to-port="1" /> + <edge from-layer="1935" from-port="4" to-layer="1943" to-port="2" /> + <edge from-layer="1936" from-port="0" to-layer="1938" to-port="2" /> + <edge from-layer="1937" from-port="0" to-layer="1938" to-port="3" /> + <edge from-layer="1938" from-port="4" to-layer="1940" to-port="0" /> + <edge from-layer="1939" from-port="0" to-layer="1940" to-port="1" /> + <edge from-layer="1940" from-port="2" to-layer="1944" to-port="0" /> + <edge from-layer="1941" from-port="0" to-layer="1943" to-port="1" /> + <edge from-layer="1942" from-port="0" to-layer="1943" to-port="3" /> + <edge from-layer="1943" from-port="4" to-layer="1944" to-port="1" /> + <edge from-layer="1944" from-port="2" to-layer="1952" to-port="0" /> + <edge from-layer="1945" from-port="0" to-layer="1948" to-port="0" /> + <edge from-layer="1946" from-port="0" to-layer="1948" to-port="1" /> + <edge from-layer="1947" from-port="0" to-layer="1948" to-port="3" /> + <edge from-layer="1948" from-port="4" to-layer="1950" to-port="0" /> + <edge from-layer="1949" from-port="0" to-layer="1950" to-port="2" /> + <edge from-layer="1950" from-port="3" to-layer="1951" to-port="0" /> + <edge from-layer="1951" from-port="2" to-layer="1952" to-port="1" /> + <edge from-layer="1951" from-port="2" to-layer="1981" to-port="1" /> + <edge from-layer="1952" from-port="2" to-layer="1953" to-port="1" /> + <edge from-layer="1953" from-port="2" to-layer="2044" to-port="0" /> + <edge from-layer="1953" from-port="2" to-layer="2008" to-port="0" /> + <edge from-layer="1954" from-port="0" to-layer="1955" to-port="1" /> + <edge from-layer="1955" from-port="2" to-layer="1959" to-port="0" /> + <edge from-layer="1956" from-port="0" to-layer="1959" to-port="1" /> + <edge from-layer="1957" from-port="0" to-layer="1959" to-port="2" /> + <edge from-layer="1958" from-port="0" to-layer="1959" to-port="3" /> + <edge from-layer="1959" from-port="4" to-layer="1974" to-port="0" /> + <edge from-layer="1959" from-port="4" to-layer="1979" to-port="0" /> + <edge from-layer="1959" from-port="4" to-layer="1963" to-port="0" /> + <edge from-layer="1959" from-port="4" to-layer="1960" to-port="0" /> + <edge from-layer="1960" from-port="2" to-layer="1982" to-port="0" /> + <edge from-layer="1961" from-port="0" to-layer="1971" to-port="0" /> + <edge from-layer="1962" from-port="0" to-layer="1971" to-port="1" /> + <edge from-layer="1963" from-port="1" to-layer="1965" to-port="0" /> + <edge from-layer="1964" from-port="0" to-layer="1965" to-port="2" /> + <edge from-layer="1965" from-port="3" to-layer="1966" to-port="0" /> + <edge from-layer="1966" from-port="2" to-layer="1967" to-port="0" /> + <edge from-layer="1967" from-port="1" to-layer="1969" to-port="0" /> + <edge from-layer="1968" from-port="0" to-layer="1969" to-port="1" /> + <edge from-layer="1969" from-port="2" to-layer="1971" to-port="2" /> + <edge from-layer="1970" from-port="0" to-layer="1971" to-port="3" /> + <edge from-layer="1971" from-port="4" to-layer="1974" to-port="1" /> + <edge from-layer="1971" from-port="4" to-layer="1979" to-port="2" /> + <edge from-layer="1972" from-port="0" to-layer="1974" to-port="2" /> + <edge from-layer="1973" from-port="0" to-layer="1974" to-port="3" /> + <edge from-layer="1974" from-port="4" to-layer="1976" to-port="0" /> + <edge from-layer="1975" from-port="0" to-layer="1976" to-port="1" /> + <edge from-layer="1976" from-port="2" to-layer="1980" to-port="0" /> + <edge from-layer="1977" from-port="0" to-layer="1979" to-port="1" /> + <edge from-layer="1978" from-port="0" to-layer="1979" to-port="3" /> + <edge from-layer="1979" from-port="4" to-layer="1980" to-port="1" /> + <edge from-layer="1980" from-port="2" to-layer="1981" to-port="0" /> + <edge from-layer="1981" from-port="2" to-layer="1982" to-port="1" /> + <edge from-layer="1982" from-port="2" to-layer="2003" to-port="0" /> + <edge from-layer="1982" from-port="2" to-layer="1983" to-port="1" /> + <edge from-layer="1983" from-port="2" to-layer="2188" to-port="0" /> + <edge from-layer="1983" from-port="2" to-layer="2044" to-port="1" /> + <edge from-layer="1984" from-port="0" to-layer="1989" to-port="0" /> + <edge from-layer="1985" from-port="0" to-layer="1988" to-port="1" /> + <edge from-layer="1986" from-port="0" to-layer="1988" to-port="2" /> + <edge from-layer="1987" from-port="0" to-layer="1988" to-port="3" /> + <edge from-layer="1988" from-port="4" to-layer="1989" to-port="1" /> + <edge from-layer="1989" from-port="2" to-layer="1990" to-port="0" /> + <edge from-layer="1990" from-port="1" to-layer="1992" to-port="0" /> + <edge from-layer="1991" from-port="0" to-layer="1992" to-port="2" /> + <edge from-layer="1992" from-port="3" to-layer="1999" to-port="0" /> + <edge from-layer="1993" from-port="0" to-layer="1996" to-port="1" /> + <edge from-layer="1994" from-port="0" to-layer="1996" to-port="2" /> + <edge from-layer="1995" from-port="0" to-layer="1996" to-port="3" /> + <edge from-layer="1996" from-port="4" to-layer="1998" to-port="0" /> + <edge from-layer="1997" from-port="0" to-layer="1998" to-port="1" /> + <edge from-layer="1998" from-port="2" to-layer="1999" to-port="1" /> + <edge from-layer="1999" from-port="2" to-layer="2187" to-port="0" /> + <edge from-layer="1999" from-port="2" to-layer="2044" to-port="2" /> + <edge from-layer="2000" from-port="0" to-layer="2022" to-port="0" /> + <edge from-layer="2001" from-port="0" to-layer="2016" to-port="0" /> + <edge from-layer="2002" from-port="0" to-layer="2016" to-port="1" /> + <edge from-layer="2002" from-port="0" to-layer="2020" to-port="1" /> + <edge from-layer="2003" from-port="1" to-layer="2006" to-port="0" /> + <edge from-layer="2004" from-port="0" to-layer="2006" to-port="1" /> + <edge from-layer="2005" from-port="0" to-layer="2006" to-port="2" /> + <edge from-layer="2006" from-port="3" to-layer="2007" to-port="1" /> + <edge from-layer="2007" from-port="2" to-layer="2012" to-port="0" /> + <edge from-layer="2007" from-port="2" to-layer="2019" to-port="0" /> + <edge from-layer="2008" from-port="1" to-layer="2037" to-port="0" /> + <edge from-layer="2008" from-port="1" to-layer="2011" to-port="0" /> + <edge from-layer="2009" from-port="0" to-layer="2011" to-port="1" /> + <edge from-layer="2010" from-port="0" to-layer="2011" to-port="2" /> + <edge from-layer="2011" from-port="3" to-layer="2012" to-port="1" /> + <edge from-layer="2012" from-port="2" to-layer="2014" to-port="0" /> + <edge from-layer="2013" from-port="0" to-layer="2014" to-port="1" /> + <edge from-layer="2014" from-port="2" to-layer="2016" to-port="2" /> + <edge from-layer="2015" from-port="0" to-layer="2016" to-port="3" /> + <edge from-layer="2015" from-port="0" to-layer="2020" to-port="3" /> + <edge from-layer="2016" from-port="4" to-layer="2022" to-port="1" /> + <edge from-layer="2017" from-port="0" to-layer="2020" to-port="0" /> + <edge from-layer="2018" from-port="0" to-layer="2019" to-port="1" /> + <edge from-layer="2019" from-port="2" to-layer="2027" to-port="2" /> + <edge from-layer="2019" from-port="2" to-layer="2020" to-port="2" /> + <edge from-layer="2020" from-port="4" to-layer="2022" to-port="2" /> + <edge from-layer="2021" from-port="0" to-layer="2022" to-port="3" /> + <edge from-layer="2022" from-port="4" to-layer="2029" to-port="0" /> + <edge from-layer="2023" from-port="0" to-layer="2029" to-port="1" /> + <edge from-layer="2024" from-port="0" to-layer="2027" to-port="0" /> + <edge from-layer="2025" from-port="0" to-layer="2027" to-port="1" /> + <edge from-layer="2026" from-port="0" to-layer="2027" to-port="3" /> + <edge from-layer="2027" from-port="4" to-layer="2029" to-port="2" /> + <edge from-layer="2028" from-port="0" to-layer="2029" to-port="3" /> + <edge from-layer="2029" from-port="4" to-layer="2032" to-port="0" /> + <edge from-layer="2030" from-port="0" to-layer="2032" to-port="1" /> + <edge from-layer="2031" from-port="0" to-layer="2032" to-port="2" /> + <edge from-layer="2032" from-port="3" to-layer="2033" to-port="0" /> + <edge from-layer="2033" from-port="2" to-layer="2034" to-port="0" /> + <edge from-layer="2033" from-port="2" to-layer="2043" to-port="0" /> + <edge from-layer="2034" from-port="1" to-layer="2042" to-port="0" /> + <edge from-layer="2035" from-port="0" to-layer="2037" to-port="1" /> + <edge from-layer="2036" from-port="0" to-layer="2037" to-port="2" /> + <edge from-layer="2037" from-port="3" to-layer="2041" to-port="0" /> + <edge from-layer="2038" from-port="0" to-layer="2041" to-port="1" /> + <edge from-layer="2039" from-port="0" to-layer="2041" to-port="2" /> + <edge from-layer="2040" from-port="0" to-layer="2041" to-port="3" /> + <edge from-layer="2041" from-port="4" to-layer="2042" to-port="1" /> + <edge from-layer="2042" from-port="2" to-layer="2043" to-port="1" /> + <edge from-layer="2043" from-port="2" to-layer="2044" to-port="3" /> + <edge from-layer="2044" from-port="4" to-layer="2046" to-port="0" /> + <edge from-layer="2045" from-port="0" to-layer="2046" to-port="1" /> + <edge from-layer="2046" from-port="2" to-layer="2048" to-port="0" /> + <edge from-layer="2047" from-port="0" to-layer="2048" to-port="1" /> + <edge from-layer="2048" from-port="2" to-layer="2057" to-port="0" /> + <edge from-layer="2049" from-port="0" to-layer="2050" to-port="0" /> + <edge from-layer="2050" from-port="1" to-layer="2053" to-port="0" /> + <edge from-layer="2051" from-port="0" to-layer="2052" to-port="0" /> + <edge from-layer="2052" from-port="1" to-layer="2053" to-port="1" /> + <edge from-layer="2053" from-port="2" to-layer="2055" to-port="0" /> + <edge from-layer="2054" from-port="0" to-layer="2055" to-port="1" /> + <edge from-layer="2055" from-port="2" to-layer="2056" to-port="0" /> + <edge from-layer="2056" from-port="1" to-layer="2057" to-port="1" /> + <edge from-layer="2057" from-port="2" to-layer="2059" to-port="0" /> + <edge from-layer="2058" from-port="0" to-layer="2059" to-port="1" /> + <edge from-layer="2059" from-port="2" to-layer="2060" to-port="0" /> + <edge from-layer="2060" from-port="2" to-layer="2062" to-port="0" /> + <edge from-layer="2060" from-port="2" to-layer="2090" to-port="1" /> + <edge from-layer="2061" from-port="0" to-layer="2062" to-port="1" /> + <edge from-layer="2062" from-port="2" to-layer="2064" to-port="0" /> + <edge from-layer="2063" from-port="0" to-layer="2064" to-port="1" /> + <edge from-layer="2064" from-port="2" to-layer="2066" to-port="0" /> + <edge from-layer="2065" from-port="0" to-layer="2066" to-port="1" /> + <edge from-layer="2066" from-port="2" to-layer="2075" to-port="0" /> + <edge from-layer="2067" from-port="0" to-layer="2068" to-port="0" /> + <edge from-layer="2068" from-port="1" to-layer="2071" to-port="0" /> + <edge from-layer="2069" from-port="0" to-layer="2070" to-port="0" /> + <edge from-layer="2070" from-port="1" to-layer="2071" to-port="1" /> + <edge from-layer="2071" from-port="2" to-layer="2073" to-port="0" /> + <edge from-layer="2072" from-port="0" to-layer="2073" to-port="1" /> + <edge from-layer="2073" from-port="2" to-layer="2074" to-port="0" /> + <edge from-layer="2074" from-port="1" to-layer="2075" to-port="1" /> + <edge from-layer="2075" from-port="2" to-layer="2077" to-port="0" /> + <edge from-layer="2076" from-port="0" to-layer="2077" to-port="1" /> + <edge from-layer="2077" from-port="2" to-layer="2078" to-port="0" /> + <edge from-layer="2078" from-port="1" to-layer="2087" to-port="0" /> + <edge from-layer="2079" from-port="0" to-layer="2080" to-port="0" /> + <edge from-layer="2080" from-port="1" to-layer="2083" to-port="0" /> + <edge from-layer="2081" from-port="0" to-layer="2082" to-port="0" /> + <edge from-layer="2082" from-port="1" to-layer="2083" to-port="1" /> + <edge from-layer="2083" from-port="2" to-layer="2085" to-port="0" /> + <edge from-layer="2084" from-port="0" to-layer="2085" to-port="1" /> + <edge from-layer="2085" from-port="2" to-layer="2086" to-port="0" /> + <edge from-layer="2086" from-port="1" to-layer="2087" to-port="1" /> + <edge from-layer="2087" from-port="2" to-layer="2089" to-port="0" /> + <edge from-layer="2088" from-port="0" to-layer="2089" to-port="1" /> + <edge from-layer="2089" from-port="2" to-layer="2090" to-port="0" /> + <edge from-layer="2090" from-port="2" to-layer="2092" to-port="0" /> + <edge from-layer="2090" from-port="2" to-layer="2299" to-port="1" /> + <edge from-layer="2091" from-port="0" to-layer="2092" to-port="1" /> + <edge from-layer="2092" from-port="2" to-layer="2094" to-port="0" /> + <edge from-layer="2093" from-port="0" to-layer="2094" to-port="1" /> + <edge from-layer="2094" from-port="2" to-layer="2096" to-port="0" /> + <edge from-layer="2095" from-port="0" to-layer="2096" to-port="1" /> + <edge from-layer="2096" from-port="2" to-layer="2105" to-port="0" /> + <edge from-layer="2097" from-port="0" to-layer="2098" to-port="0" /> + <edge from-layer="2098" from-port="1" to-layer="2101" to-port="0" /> + <edge from-layer="2099" from-port="0" to-layer="2100" to-port="0" /> + <edge from-layer="2100" from-port="1" to-layer="2101" to-port="1" /> + <edge from-layer="2101" from-port="2" to-layer="2103" to-port="0" /> + <edge from-layer="2102" from-port="0" to-layer="2103" to-port="1" /> + <edge from-layer="2103" from-port="2" to-layer="2104" to-port="0" /> + <edge from-layer="2104" from-port="1" to-layer="2105" to-port="1" /> + <edge from-layer="2105" from-port="2" to-layer="2107" to-port="0" /> + <edge from-layer="2106" from-port="0" to-layer="2107" to-port="1" /> + <edge from-layer="2107" from-port="2" to-layer="2109" to-port="0" /> + <edge from-layer="2108" from-port="0" to-layer="2109" to-port="1" /> + <edge from-layer="2109" from-port="2" to-layer="2209" to-port="0" /> + <edge from-layer="2109" from-port="2" to-layer="2130" to-port="0" /> + <edge from-layer="2109" from-port="2" to-layer="2113" to-port="0" /> + <edge from-layer="2110" from-port="0" to-layer="2113" to-port="1" /> + <edge from-layer="2111" from-port="0" to-layer="2113" to-port="2" /> + <edge from-layer="2112" from-port="0" to-layer="2113" to-port="3" /> + <edge from-layer="2113" from-port="4" to-layer="2115" to-port="0" /> + <edge from-layer="2114" from-port="0" to-layer="2115" to-port="1" /> + <edge from-layer="2115" from-port="2" to-layer="2116" to-port="1" /> + <edge from-layer="2116" from-port="2" to-layer="2117" to-port="0" /> + <edge from-layer="2116" from-port="2" to-layer="2283" to-port="2" /> + <edge from-layer="2118" from-port="0" to-layer="2123" to-port="0" /> + <edge from-layer="2119" from-port="0" to-layer="2122" to-port="1" /> + <edge from-layer="2120" from-port="0" to-layer="2122" to-port="2" /> + <edge from-layer="2121" from-port="0" to-layer="2122" to-port="3" /> + <edge from-layer="2122" from-port="4" to-layer="2123" to-port="1" /> + <edge from-layer="2123" from-port="2" to-layer="2124" to-port="0" /> + <edge from-layer="2124" from-port="1" to-layer="2126" to-port="0" /> + <edge from-layer="2125" from-port="0" to-layer="2126" to-port="2" /> + <edge from-layer="2126" from-port="3" to-layer="2185" to-port="0" /> + <edge from-layer="2126" from-port="3" to-layer="2143" to-port="0" /> + <edge from-layer="2127" from-port="0" to-layer="2130" to-port="1" /> + <edge from-layer="2128" from-port="0" to-layer="2130" to-port="2" /> + <edge from-layer="2129" from-port="0" to-layer="2130" to-port="3" /> + <edge from-layer="2130" from-port="4" to-layer="2132" to-port="0" /> + <edge from-layer="2130" from-port="4" to-layer="2139" to-port="0" /> + <edge from-layer="2131" from-port="0" to-layer="2132" to-port="1" /> + <edge from-layer="2132" from-port="2" to-layer="2136" to-port="0" /> + <edge from-layer="2133" from-port="0" to-layer="2136" to-port="1" /> + <edge from-layer="2134" from-port="0" to-layer="2136" to-port="2" /> + <edge from-layer="2135" from-port="0" to-layer="2136" to-port="3" /> + <edge from-layer="2136" from-port="4" to-layer="2169" to-port="0" /> + <edge from-layer="2136" from-port="4" to-layer="2174" to-port="0" /> + <edge from-layer="2136" from-port="4" to-layer="2158" to-port="0" /> + <edge from-layer="2136" from-port="4" to-layer="2155" to-port="0" /> + <edge from-layer="2137" from-port="0" to-layer="2151" to-port="0" /> + <edge from-layer="2138" from-port="0" to-layer="2151" to-port="1" /> + <edge from-layer="2139" from-port="1" to-layer="2142" to-port="0" /> + <edge from-layer="2140" from-port="0" to-layer="2142" to-port="1" /> + <edge from-layer="2141" from-port="0" to-layer="2142" to-port="2" /> + <edge from-layer="2142" from-port="3" to-layer="2149" to-port="0" /> + <edge from-layer="2143" from-port="1" to-layer="2146" to-port="0" /> + <edge from-layer="2144" from-port="0" to-layer="2146" to-port="1" /> + <edge from-layer="2145" from-port="0" to-layer="2146" to-port="2" /> + <edge from-layer="2146" from-port="3" to-layer="2246" to-port="0" /> + <edge from-layer="2146" from-port="3" to-layer="2148" to-port="0" /> + <edge from-layer="2147" from-port="0" to-layer="2148" to-port="1" /> + <edge from-layer="2148" from-port="2" to-layer="2149" to-port="1" /> + <edge from-layer="2149" from-port="2" to-layer="2151" to-port="2" /> + <edge from-layer="2149" from-port="2" to-layer="2179" to-port="2" /> + <edge from-layer="2150" from-port="0" to-layer="2151" to-port="3" /> + <edge from-layer="2151" from-port="4" to-layer="2153" to-port="0" /> + <edge from-layer="2152" from-port="0" to-layer="2153" to-port="2" /> + <edge from-layer="2153" from-port="3" to-layer="2154" to-port="0" /> + <edge from-layer="2154" from-port="2" to-layer="2155" to-port="1" /> + <edge from-layer="2154" from-port="2" to-layer="2216" to-port="1" /> + <edge from-layer="2155" from-port="2" to-layer="2184" to-port="0" /> + <edge from-layer="2156" from-port="0" to-layer="2166" to-port="0" /> + <edge from-layer="2157" from-port="0" to-layer="2166" to-port="1" /> + <edge from-layer="2158" from-port="1" to-layer="2160" to-port="0" /> + <edge from-layer="2159" from-port="0" to-layer="2160" to-port="2" /> + <edge from-layer="2160" from-port="3" to-layer="2161" to-port="0" /> + <edge from-layer="2161" from-port="2" to-layer="2162" to-port="0" /> + <edge from-layer="2162" from-port="1" to-layer="2164" to-port="0" /> + <edge from-layer="2163" from-port="0" to-layer="2164" to-port="1" /> + <edge from-layer="2164" from-port="2" to-layer="2166" to-port="2" /> + <edge from-layer="2165" from-port="0" to-layer="2166" to-port="3" /> + <edge from-layer="2166" from-port="4" to-layer="2169" to-port="1" /> + <edge from-layer="2166" from-port="4" to-layer="2174" to-port="2" /> + <edge from-layer="2167" from-port="0" to-layer="2169" to-port="2" /> + <edge from-layer="2168" from-port="0" to-layer="2169" to-port="3" /> + <edge from-layer="2169" from-port="4" to-layer="2171" to-port="0" /> + <edge from-layer="2170" from-port="0" to-layer="2171" to-port="1" /> + <edge from-layer="2171" from-port="2" to-layer="2175" to-port="0" /> + <edge from-layer="2172" from-port="0" to-layer="2174" to-port="1" /> + <edge from-layer="2173" from-port="0" to-layer="2174" to-port="3" /> + <edge from-layer="2174" from-port="4" to-layer="2175" to-port="1" /> + <edge from-layer="2175" from-port="2" to-layer="2183" to-port="0" /> + <edge from-layer="2176" from-port="0" to-layer="2179" to-port="0" /> + <edge from-layer="2177" from-port="0" to-layer="2179" to-port="1" /> + <edge from-layer="2178" from-port="0" to-layer="2179" to-port="3" /> + <edge from-layer="2179" from-port="4" to-layer="2181" to-port="0" /> + <edge from-layer="2180" from-port="0" to-layer="2181" to-port="2" /> + <edge from-layer="2181" from-port="3" to-layer="2182" to-port="0" /> + <edge from-layer="2182" from-port="2" to-layer="2237" to-port="1" /> + <edge from-layer="2182" from-port="2" to-layer="2183" to-port="1" /> + <edge from-layer="2183" from-port="2" to-layer="2184" to-port="1" /> + <edge from-layer="2184" from-port="2" to-layer="2185" to-port="1" /> + <edge from-layer="2184" from-port="2" to-layer="2242" to-port="0" /> + <edge from-layer="2185" from-port="2" to-layer="2186" to-port="0" /> + <edge from-layer="2185" from-port="2" to-layer="2283" to-port="1" /> + <edge from-layer="2197" from-port="0" to-layer="2202" to-port="0" /> + <edge from-layer="2198" from-port="0" to-layer="2201" to-port="1" /> + <edge from-layer="2199" from-port="0" to-layer="2201" to-port="2" /> + <edge from-layer="2200" from-port="0" to-layer="2201" to-port="3" /> + <edge from-layer="2201" from-port="4" to-layer="2202" to-port="1" /> + <edge from-layer="2202" from-port="2" to-layer="2203" to-port="0" /> + <edge from-layer="2203" from-port="1" to-layer="2205" to-port="0" /> + <edge from-layer="2204" from-port="0" to-layer="2205" to-port="2" /> + <edge from-layer="2205" from-port="3" to-layer="7277" to-port="0" /> + <edge from-layer="2205" from-port="3" to-layer="7122" to-port="0" /> + <edge from-layer="2206" from-port="0" to-layer="2209" to-port="1" /> + <edge from-layer="2207" from-port="0" to-layer="2209" to-port="2" /> + <edge from-layer="2208" from-port="0" to-layer="2209" to-port="3" /> + <edge from-layer="2209" from-port="4" to-layer="2211" to-port="0" /> + <edge from-layer="2210" from-port="0" to-layer="2211" to-port="1" /> + <edge from-layer="2211" from-port="2" to-layer="2215" to-port="0" /> + <edge from-layer="2212" from-port="0" to-layer="2215" to-port="1" /> + <edge from-layer="2213" from-port="0" to-layer="2215" to-port="2" /> + <edge from-layer="2214" from-port="0" to-layer="2215" to-port="3" /> + <edge from-layer="2215" from-port="4" to-layer="2235" to-port="0" /> + <edge from-layer="2215" from-port="4" to-layer="2219" to-port="0" /> + <edge from-layer="2215" from-port="4" to-layer="2216" to-port="0" /> + <edge from-layer="2215" from-port="4" to-layer="2230" to-port="0" /> + <edge from-layer="2216" from-port="2" to-layer="2238" to-port="0" /> + <edge from-layer="2217" from-port="0" to-layer="2227" to-port="0" /> + <edge from-layer="2218" from-port="0" to-layer="2227" to-port="1" /> + <edge from-layer="2219" from-port="1" to-layer="2221" to-port="0" /> + <edge from-layer="2220" from-port="0" to-layer="2221" to-port="2" /> + <edge from-layer="2221" from-port="3" to-layer="2222" to-port="0" /> + <edge from-layer="2222" from-port="2" to-layer="2223" to-port="0" /> + <edge from-layer="2223" from-port="1" to-layer="2225" to-port="0" /> + <edge from-layer="2224" from-port="0" to-layer="2225" to-port="1" /> + <edge from-layer="2225" from-port="2" to-layer="2227" to-port="2" /> + <edge from-layer="2226" from-port="0" to-layer="2227" to-port="3" /> + <edge from-layer="2227" from-port="4" to-layer="2230" to-port="1" /> + <edge from-layer="2227" from-port="4" to-layer="2235" to-port="2" /> + <edge from-layer="2228" from-port="0" to-layer="2230" to-port="2" /> + <edge from-layer="2229" from-port="0" to-layer="2230" to-port="3" /> + <edge from-layer="2230" from-port="4" to-layer="2232" to-port="0" /> + <edge from-layer="2231" from-port="0" to-layer="2232" to-port="1" /> + <edge from-layer="2232" from-port="2" to-layer="2236" to-port="0" /> + <edge from-layer="2233" from-port="0" to-layer="2235" to-port="1" /> + <edge from-layer="2234" from-port="0" to-layer="2235" to-port="3" /> + <edge from-layer="2235" from-port="4" to-layer="2236" to-port="1" /> + <edge from-layer="2236" from-port="2" to-layer="2237" to-port="0" /> + <edge from-layer="2237" from-port="2" to-layer="2238" to-port="1" /> + <edge from-layer="2238" from-port="2" to-layer="2247" to-port="0" /> + <edge from-layer="2238" from-port="2" to-layer="2283" to-port="0" /> + <edge from-layer="2239" from-port="0" to-layer="2261" to-port="0" /> + <edge from-layer="2240" from-port="0" to-layer="2255" to-port="0" /> + <edge from-layer="2241" from-port="0" to-layer="2259" to-port="1" /> + <edge from-layer="2241" from-port="0" to-layer="2255" to-port="1" /> + <edge from-layer="2242" from-port="1" to-layer="2245" to-port="0" /> + <edge from-layer="2243" from-port="0" to-layer="2245" to-port="1" /> + <edge from-layer="2244" from-port="0" to-layer="2245" to-port="2" /> + <edge from-layer="2245" from-port="3" to-layer="2246" to-port="1" /> + <edge from-layer="2246" from-port="2" to-layer="2258" to-port="0" /> + <edge from-layer="2246" from-port="2" to-layer="2251" to-port="0" /> + <edge from-layer="2247" from-port="1" to-layer="2276" to-port="0" /> + <edge from-layer="2247" from-port="1" to-layer="2250" to-port="0" /> + <edge from-layer="2248" from-port="0" to-layer="2250" to-port="1" /> + <edge from-layer="2249" from-port="0" to-layer="2250" to-port="2" /> + <edge from-layer="2250" from-port="3" to-layer="2251" to-port="1" /> + <edge from-layer="2251" from-port="2" to-layer="2253" to-port="0" /> + <edge from-layer="2252" from-port="0" to-layer="2253" to-port="1" /> + <edge from-layer="2253" from-port="2" to-layer="2255" to-port="2" /> + <edge from-layer="2254" from-port="0" to-layer="2255" to-port="3" /> + <edge from-layer="2254" from-port="0" to-layer="2259" to-port="3" /> + <edge from-layer="2255" from-port="4" to-layer="2261" to-port="1" /> + <edge from-layer="2256" from-port="0" to-layer="2259" to-port="0" /> + <edge from-layer="2257" from-port="0" to-layer="2258" to-port="1" /> + <edge from-layer="2258" from-port="2" to-layer="2266" to-port="2" /> + <edge from-layer="2258" from-port="2" to-layer="2259" to-port="2" /> + <edge from-layer="2259" from-port="4" to-layer="2261" to-port="2" /> + <edge from-layer="2260" from-port="0" to-layer="2261" to-port="3" /> + <edge from-layer="2261" from-port="4" to-layer="2268" to-port="0" /> + <edge from-layer="2262" from-port="0" to-layer="2268" to-port="1" /> + <edge from-layer="2263" from-port="0" to-layer="2266" to-port="0" /> + <edge from-layer="2264" from-port="0" to-layer="2266" to-port="1" /> + <edge from-layer="2265" from-port="0" to-layer="2266" to-port="3" /> + <edge from-layer="2266" from-port="4" to-layer="2268" to-port="2" /> + <edge from-layer="2267" from-port="0" to-layer="2268" to-port="3" /> + <edge from-layer="2268" from-port="4" to-layer="2271" to-port="0" /> + <edge from-layer="2269" from-port="0" to-layer="2271" to-port="1" /> + <edge from-layer="2270" from-port="0" to-layer="2271" to-port="2" /> + <edge from-layer="2271" from-port="3" to-layer="2272" to-port="0" /> + <edge from-layer="2272" from-port="2" to-layer="2282" to-port="0" /> + <edge from-layer="2272" from-port="2" to-layer="2273" to-port="0" /> + <edge from-layer="2273" from-port="1" to-layer="2281" to-port="0" /> + <edge from-layer="2274" from-port="0" to-layer="2276" to-port="1" /> + <edge from-layer="2275" from-port="0" to-layer="2276" to-port="2" /> + <edge from-layer="2276" from-port="3" to-layer="2280" to-port="0" /> + <edge from-layer="2277" from-port="0" to-layer="2280" to-port="1" /> + <edge from-layer="2278" from-port="0" to-layer="2280" to-port="2" /> + <edge from-layer="2279" from-port="0" to-layer="2280" to-port="3" /> + <edge from-layer="2280" from-port="4" to-layer="2281" to-port="1" /> + <edge from-layer="2281" from-port="2" to-layer="2282" to-port="1" /> + <edge from-layer="2282" from-port="2" to-layer="2283" to-port="3" /> + <edge from-layer="2283" from-port="4" to-layer="2285" to-port="0" /> + <edge from-layer="2284" from-port="0" to-layer="2285" to-port="1" /> + <edge from-layer="2285" from-port="2" to-layer="2287" to-port="0" /> + <edge from-layer="2286" from-port="0" to-layer="2287" to-port="1" /> + <edge from-layer="2287" from-port="2" to-layer="2296" to-port="0" /> + <edge from-layer="2288" from-port="0" to-layer="2289" to-port="0" /> + <edge from-layer="2289" from-port="1" to-layer="2292" to-port="0" /> + <edge from-layer="2290" from-port="0" to-layer="2291" to-port="0" /> + <edge from-layer="2291" from-port="1" to-layer="2292" to-port="1" /> + <edge from-layer="2292" from-port="2" to-layer="2294" to-port="0" /> + <edge from-layer="2293" from-port="0" to-layer="2294" to-port="1" /> + <edge from-layer="2294" from-port="2" to-layer="2295" to-port="0" /> + <edge from-layer="2295" from-port="1" to-layer="2296" to-port="1" /> + <edge from-layer="2296" from-port="2" to-layer="2298" to-port="0" /> + <edge from-layer="2297" from-port="0" to-layer="2298" to-port="1" /> + <edge from-layer="2298" from-port="2" to-layer="2299" to-port="0" /> + <edge from-layer="2299" from-port="2" to-layer="2301" to-port="0" /> + <edge from-layer="2299" from-port="2" to-layer="2329" to-port="1" /> + <edge from-layer="2300" from-port="0" to-layer="2301" to-port="1" /> + <edge from-layer="2301" from-port="2" to-layer="2303" to-port="0" /> + <edge from-layer="2302" from-port="0" to-layer="2303" to-port="1" /> + <edge from-layer="2303" from-port="2" to-layer="2305" to-port="0" /> + <edge from-layer="2304" from-port="0" to-layer="2305" to-port="1" /> + <edge from-layer="2305" from-port="2" to-layer="2314" to-port="0" /> + <edge from-layer="2306" from-port="0" to-layer="2307" to-port="0" /> + <edge from-layer="2307" from-port="1" to-layer="2310" to-port="0" /> + <edge from-layer="2308" from-port="0" to-layer="2309" to-port="0" /> + <edge from-layer="2309" from-port="1" to-layer="2310" to-port="1" /> + <edge from-layer="2310" from-port="2" to-layer="2312" to-port="0" /> + <edge from-layer="2311" from-port="0" to-layer="2312" to-port="1" /> + <edge from-layer="2312" from-port="2" to-layer="2313" to-port="0" /> + <edge from-layer="2313" from-port="1" to-layer="2314" to-port="1" /> + <edge from-layer="2314" from-port="2" to-layer="2316" to-port="0" /> + <edge from-layer="2315" from-port="0" to-layer="2316" to-port="1" /> + <edge from-layer="2316" from-port="2" to-layer="2317" to-port="0" /> + <edge from-layer="2317" from-port="1" to-layer="2326" to-port="0" /> + <edge from-layer="2318" from-port="0" to-layer="2319" to-port="0" /> + <edge from-layer="2319" from-port="1" to-layer="2322" to-port="0" /> + <edge from-layer="2320" from-port="0" to-layer="2321" to-port="0" /> + <edge from-layer="2321" from-port="1" to-layer="2322" to-port="1" /> + <edge from-layer="2322" from-port="2" to-layer="2324" to-port="0" /> + <edge from-layer="2323" from-port="0" to-layer="2324" to-port="1" /> + <edge from-layer="2324" from-port="2" to-layer="2325" to-port="0" /> + <edge from-layer="2325" from-port="1" to-layer="2326" to-port="1" /> + <edge from-layer="2326" from-port="2" to-layer="2328" to-port="0" /> + <edge from-layer="2327" from-port="0" to-layer="2328" to-port="1" /> + <edge from-layer="2328" from-port="2" to-layer="2329" to-port="0" /> + <edge from-layer="2329" from-port="2" to-layer="2526" to-port="1" /> + <edge from-layer="2329" from-port="2" to-layer="2331" to-port="0" /> + <edge from-layer="2330" from-port="0" to-layer="2331" to-port="1" /> + <edge from-layer="2331" from-port="2" to-layer="2333" to-port="0" /> + <edge from-layer="2332" from-port="0" to-layer="2333" to-port="1" /> + <edge from-layer="2333" from-port="2" to-layer="2335" to-port="0" /> + <edge from-layer="2334" from-port="0" to-layer="2335" to-port="1" /> + <edge from-layer="2335" from-port="2" to-layer="2344" to-port="0" /> + <edge from-layer="2336" from-port="0" to-layer="2337" to-port="0" /> + <edge from-layer="2337" from-port="1" to-layer="2340" to-port="0" /> + <edge from-layer="2338" from-port="0" to-layer="2339" to-port="0" /> + <edge from-layer="2339" from-port="1" to-layer="2340" to-port="1" /> + <edge from-layer="2340" from-port="2" to-layer="2342" to-port="0" /> + <edge from-layer="2341" from-port="0" to-layer="2342" to-port="1" /> + <edge from-layer="2342" from-port="2" to-layer="2343" to-port="0" /> + <edge from-layer="2343" from-port="1" to-layer="2344" to-port="1" /> + <edge from-layer="2344" from-port="2" to-layer="2346" to-port="0" /> + <edge from-layer="2345" from-port="0" to-layer="2346" to-port="1" /> + <edge from-layer="2346" from-port="2" to-layer="2348" to-port="0" /> + <edge from-layer="2347" from-port="0" to-layer="2348" to-port="1" /> + <edge from-layer="2348" from-port="2" to-layer="2462" to-port="0" /> + <edge from-layer="2348" from-port="2" to-layer="2352" to-port="0" /> + <edge from-layer="2348" from-port="2" to-layer="2364" to-port="0" /> + <edge from-layer="2349" from-port="0" to-layer="2352" to-port="1" /> + <edge from-layer="2350" from-port="0" to-layer="2352" to-port="2" /> + <edge from-layer="2351" from-port="0" to-layer="2352" to-port="3" /> + <edge from-layer="2352" from-port="4" to-layer="2354" to-port="0" /> + <edge from-layer="2353" from-port="0" to-layer="2354" to-port="1" /> + <edge from-layer="2354" from-port="2" to-layer="2358" to-port="0" /> + <edge from-layer="2355" from-port="0" to-layer="2358" to-port="1" /> + <edge from-layer="2356" from-port="0" to-layer="2358" to-port="2" /> + <edge from-layer="2357" from-port="0" to-layer="2358" to-port="3" /> + <edge from-layer="2358" from-port="4" to-layer="2404" to-port="0" /> + <edge from-layer="2358" from-port="4" to-layer="2409" to-port="0" /> + <edge from-layer="2358" from-port="4" to-layer="2393" to-port="0" /> + <edge from-layer="2358" from-port="4" to-layer="2390" to-port="0" /> + <edge from-layer="2359" from-port="0" to-layer="2386" to-port="0" /> + <edge from-layer="2360" from-port="0" to-layer="2386" to-port="1" /> + <edge from-layer="2361" from-port="0" to-layer="2364" to-port="1" /> + <edge from-layer="2362" from-port="0" to-layer="2364" to-port="2" /> + <edge from-layer="2363" from-port="0" to-layer="2364" to-port="3" /> + <edge from-layer="2364" from-port="4" to-layer="2365" to-port="0" /> + <edge from-layer="2364" from-port="4" to-layer="2421" to-port="0" /> + <edge from-layer="2365" from-port="1" to-layer="2368" to-port="0" /> + <edge from-layer="2366" from-port="0" to-layer="2368" to-port="1" /> + <edge from-layer="2367" from-port="0" to-layer="2368" to-port="2" /> + <edge from-layer="2368" from-port="3" to-layer="2384" to-port="0" /> + <edge from-layer="2369" from-port="0" to-layer="2374" to-port="0" /> + <edge from-layer="2370" from-port="0" to-layer="2373" to-port="1" /> + <edge from-layer="2371" from-port="0" to-layer="2373" to-port="2" /> + <edge from-layer="2372" from-port="0" to-layer="2373" to-port="3" /> + <edge from-layer="2373" from-port="4" to-layer="2374" to-port="1" /> + <edge from-layer="2374" from-port="2" to-layer="2375" to-port="0" /> + <edge from-layer="2375" from-port="1" to-layer="2377" to-port="0" /> + <edge from-layer="2376" from-port="0" to-layer="2377" to-port="2" /> + <edge from-layer="2377" from-port="3" to-layer="2378" to-port="0" /> + <edge from-layer="2377" from-port="3" to-layer="2449" to-port="0" /> + <edge from-layer="2378" from-port="1" to-layer="2381" to-port="0" /> + <edge from-layer="2379" from-port="0" to-layer="2381" to-port="1" /> + <edge from-layer="2380" from-port="0" to-layer="2381" to-port="2" /> + <edge from-layer="2381" from-port="3" to-layer="2473" to-port="0" /> + <edge from-layer="2381" from-port="3" to-layer="2383" to-port="0" /> + <edge from-layer="2382" from-port="0" to-layer="2383" to-port="1" /> + <edge from-layer="2383" from-port="2" to-layer="2384" to-port="1" /> + <edge from-layer="2384" from-port="2" to-layer="2386" to-port="2" /> + <edge from-layer="2384" from-port="2" to-layer="2414" to-port="2" /> + <edge from-layer="2385" from-port="0" to-layer="2386" to-port="3" /> + <edge from-layer="2386" from-port="4" to-layer="2388" to-port="0" /> + <edge from-layer="2387" from-port="0" to-layer="2388" to-port="2" /> + <edge from-layer="2388" from-port="3" to-layer="2389" to-port="0" /> + <edge from-layer="2389" from-port="2" to-layer="2390" to-port="1" /> + <edge from-layer="2389" from-port="2" to-layer="2426" to-port="1" /> + <edge from-layer="2390" from-port="2" to-layer="2419" to-port="0" /> + <edge from-layer="2391" from-port="0" to-layer="2401" to-port="0" /> + <edge from-layer="2392" from-port="0" to-layer="2401" to-port="1" /> + <edge from-layer="2393" from-port="1" to-layer="2395" to-port="0" /> + <edge from-layer="2394" from-port="0" to-layer="2395" to-port="2" /> + <edge from-layer="2395" from-port="3" to-layer="2396" to-port="0" /> + <edge from-layer="2396" from-port="2" to-layer="2397" to-port="0" /> + <edge from-layer="2397" from-port="1" to-layer="2399" to-port="0" /> + <edge from-layer="2398" from-port="0" to-layer="2399" to-port="1" /> + <edge from-layer="2399" from-port="2" to-layer="2401" to-port="2" /> + <edge from-layer="2400" from-port="0" to-layer="2401" to-port="3" /> + <edge from-layer="2401" from-port="4" to-layer="2409" to-port="2" /> + <edge from-layer="2401" from-port="4" to-layer="2404" to-port="1" /> + <edge from-layer="2402" from-port="0" to-layer="2404" to-port="2" /> + <edge from-layer="2403" from-port="0" to-layer="2404" to-port="3" /> + <edge from-layer="2404" from-port="4" to-layer="2406" to-port="0" /> + <edge from-layer="2405" from-port="0" to-layer="2406" to-port="1" /> + <edge from-layer="2406" from-port="2" to-layer="2410" to-port="0" /> + <edge from-layer="2407" from-port="0" to-layer="2409" to-port="1" /> + <edge from-layer="2408" from-port="0" to-layer="2409" to-port="3" /> + <edge from-layer="2409" from-port="4" to-layer="2410" to-port="1" /> + <edge from-layer="2410" from-port="2" to-layer="2418" to-port="0" /> + <edge from-layer="2411" from-port="0" to-layer="2414" to-port="0" /> + <edge from-layer="2412" from-port="0" to-layer="2414" to-port="1" /> + <edge from-layer="2413" from-port="0" to-layer="2414" to-port="3" /> + <edge from-layer="2414" from-port="4" to-layer="2416" to-port="0" /> + <edge from-layer="2415" from-port="0" to-layer="2416" to-port="2" /> + <edge from-layer="2416" from-port="3" to-layer="2417" to-port="0" /> + <edge from-layer="2417" from-port="2" to-layer="2418" to-port="1" /> + <edge from-layer="2417" from-port="2" to-layer="2447" to-port="1" /> + <edge from-layer="2418" from-port="2" to-layer="2419" to-port="1" /> + <edge from-layer="2419" from-port="2" to-layer="2510" to-port="0" /> + <edge from-layer="2419" from-port="2" to-layer="2474" to-port="0" /> + <edge from-layer="2420" from-port="0" to-layer="2421" to-port="1" /> + <edge from-layer="2421" from-port="2" to-layer="2425" to-port="0" /> + <edge from-layer="2422" from-port="0" to-layer="2425" to-port="1" /> + <edge from-layer="2423" from-port="0" to-layer="2425" to-port="2" /> + <edge from-layer="2424" from-port="0" to-layer="2425" to-port="3" /> + <edge from-layer="2425" from-port="4" to-layer="2440" to-port="0" /> + <edge from-layer="2425" from-port="4" to-layer="2426" to-port="0" /> + <edge from-layer="2425" from-port="4" to-layer="2445" to-port="0" /> + <edge from-layer="2425" from-port="4" to-layer="2429" to-port="0" /> + <edge from-layer="2426" from-port="2" to-layer="2448" to-port="0" /> + <edge from-layer="2427" from-port="0" to-layer="2437" to-port="0" /> + <edge from-layer="2428" from-port="0" to-layer="2437" to-port="1" /> + <edge from-layer="2429" from-port="1" to-layer="2431" to-port="0" /> + <edge from-layer="2430" from-port="0" to-layer="2431" to-port="2" /> + <edge from-layer="2431" from-port="3" to-layer="2432" to-port="0" /> + <edge from-layer="2432" from-port="2" to-layer="2433" to-port="0" /> + <edge from-layer="2433" from-port="1" to-layer="2435" to-port="0" /> + <edge from-layer="2434" from-port="0" to-layer="2435" to-port="1" /> + <edge from-layer="2435" from-port="2" to-layer="2437" to-port="2" /> + <edge from-layer="2436" from-port="0" to-layer="2437" to-port="3" /> + <edge from-layer="2437" from-port="4" to-layer="2440" to-port="1" /> + <edge from-layer="2437" from-port="4" to-layer="2445" to-port="2" /> + <edge from-layer="2438" from-port="0" to-layer="2440" to-port="2" /> + <edge from-layer="2439" from-port="0" to-layer="2440" to-port="3" /> + <edge from-layer="2440" from-port="4" to-layer="2442" to-port="0" /> + <edge from-layer="2441" from-port="0" to-layer="2442" to-port="1" /> + <edge from-layer="2442" from-port="2" to-layer="2446" to-port="0" /> + <edge from-layer="2443" from-port="0" to-layer="2445" to-port="1" /> + <edge from-layer="2444" from-port="0" to-layer="2445" to-port="3" /> + <edge from-layer="2445" from-port="4" to-layer="2446" to-port="1" /> + <edge from-layer="2446" from-port="2" to-layer="2447" to-port="0" /> + <edge from-layer="2447" from-port="2" to-layer="2448" to-port="1" /> + <edge from-layer="2448" from-port="2" to-layer="2449" to-port="1" /> + <edge from-layer="2448" from-port="2" to-layer="2469" to-port="0" /> + <edge from-layer="2449" from-port="2" to-layer="2510" to-port="1" /> + <edge from-layer="2449" from-port="2" to-layer="7236" to-port="0" /> + <edge from-layer="2450" from-port="0" to-layer="2455" to-port="0" /> + <edge from-layer="2451" from-port="0" to-layer="2454" to-port="1" /> + <edge from-layer="2452" from-port="0" to-layer="2454" to-port="2" /> + <edge from-layer="2453" from-port="0" to-layer="2454" to-port="3" /> + <edge from-layer="2454" from-port="4" to-layer="2455" to-port="1" /> + <edge from-layer="2455" from-port="2" to-layer="2456" to-port="0" /> + <edge from-layer="2456" from-port="1" to-layer="2458" to-port="0" /> + <edge from-layer="2457" from-port="0" to-layer="2458" to-port="2" /> + <edge from-layer="2458" from-port="3" to-layer="2465" to-port="0" /> + <edge from-layer="2459" from-port="0" to-layer="2462" to-port="1" /> + <edge from-layer="2460" from-port="0" to-layer="2462" to-port="2" /> + <edge from-layer="2461" from-port="0" to-layer="2462" to-port="3" /> + <edge from-layer="2462" from-port="4" to-layer="2464" to-port="0" /> + <edge from-layer="2463" from-port="0" to-layer="2464" to-port="1" /> + <edge from-layer="2464" from-port="2" to-layer="2465" to-port="1" /> + <edge from-layer="2465" from-port="2" to-layer="7235" to-port="0" /> + <edge from-layer="2465" from-port="2" to-layer="2510" to-port="2" /> + <edge from-layer="2466" from-port="0" to-layer="2488" to-port="0" /> + <edge from-layer="2467" from-port="0" to-layer="2482" to-port="0" /> + <edge from-layer="2468" from-port="0" to-layer="2486" to-port="1" /> + <edge from-layer="2468" from-port="0" to-layer="2482" to-port="1" /> + <edge from-layer="2469" from-port="1" to-layer="2472" to-port="0" /> + <edge from-layer="2470" from-port="0" to-layer="2472" to-port="1" /> + <edge from-layer="2471" from-port="0" to-layer="2472" to-port="2" /> + <edge from-layer="2472" from-port="3" to-layer="2473" to-port="1" /> + <edge from-layer="2473" from-port="2" to-layer="2478" to-port="0" /> + <edge from-layer="2473" from-port="2" to-layer="2485" to-port="0" /> + <edge from-layer="2474" from-port="1" to-layer="2503" to-port="0" /> + <edge from-layer="2474" from-port="1" to-layer="2477" to-port="0" /> + <edge from-layer="2475" from-port="0" to-layer="2477" to-port="1" /> + <edge from-layer="2476" from-port="0" to-layer="2477" to-port="2" /> + <edge from-layer="2477" from-port="3" to-layer="2478" to-port="1" /> + <edge from-layer="2478" from-port="2" to-layer="2480" to-port="0" /> + <edge from-layer="2479" from-port="0" to-layer="2480" to-port="1" /> + <edge from-layer="2480" from-port="2" to-layer="2482" to-port="2" /> + <edge from-layer="2481" from-port="0" to-layer="2486" to-port="3" /> + <edge from-layer="2481" from-port="0" to-layer="2482" to-port="3" /> + <edge from-layer="2482" from-port="4" to-layer="2488" to-port="1" /> + <edge from-layer="2483" from-port="0" to-layer="2486" to-port="0" /> + <edge from-layer="2484" from-port="0" to-layer="2485" to-port="1" /> + <edge from-layer="2485" from-port="2" to-layer="2486" to-port="2" /> + <edge from-layer="2485" from-port="2" to-layer="2493" to-port="2" /> + <edge from-layer="2486" from-port="4" to-layer="2488" to-port="2" /> + <edge from-layer="2487" from-port="0" to-layer="2488" to-port="3" /> + <edge from-layer="2488" from-port="4" to-layer="2495" to-port="0" /> + <edge from-layer="2489" from-port="0" to-layer="2495" to-port="1" /> + <edge from-layer="2490" from-port="0" to-layer="2493" to-port="0" /> + <edge from-layer="2491" from-port="0" to-layer="2493" to-port="1" /> + <edge from-layer="2492" from-port="0" to-layer="2493" to-port="3" /> + <edge from-layer="2493" from-port="4" to-layer="2495" to-port="2" /> + <edge from-layer="2494" from-port="0" to-layer="2495" to-port="3" /> + <edge from-layer="2495" from-port="4" to-layer="2498" to-port="0" /> + <edge from-layer="2496" from-port="0" to-layer="2498" to-port="1" /> + <edge from-layer="2497" from-port="0" to-layer="2498" to-port="2" /> + <edge from-layer="2498" from-port="3" to-layer="2499" to-port="0" /> + <edge from-layer="2499" from-port="2" to-layer="2500" to-port="0" /> + <edge from-layer="2499" from-port="2" to-layer="2509" to-port="0" /> + <edge from-layer="2500" from-port="1" to-layer="2508" to-port="0" /> + <edge from-layer="2501" from-port="0" to-layer="2503" to-port="1" /> + <edge from-layer="2502" from-port="0" to-layer="2503" to-port="2" /> + <edge from-layer="2503" from-port="3" to-layer="2507" to-port="0" /> + <edge from-layer="2504" from-port="0" to-layer="2507" to-port="1" /> + <edge from-layer="2505" from-port="0" to-layer="2507" to-port="2" /> + <edge from-layer="2506" from-port="0" to-layer="2507" to-port="3" /> + <edge from-layer="2507" from-port="4" to-layer="2508" to-port="1" /> + <edge from-layer="2508" from-port="2" to-layer="2509" to-port="1" /> + <edge from-layer="2509" from-port="2" to-layer="2510" to-port="3" /> + <edge from-layer="2510" from-port="4" to-layer="2512" to-port="0" /> + <edge from-layer="2511" from-port="0" to-layer="2512" to-port="1" /> + <edge from-layer="2512" from-port="2" to-layer="2514" to-port="0" /> + <edge from-layer="2513" from-port="0" to-layer="2514" to-port="1" /> + <edge from-layer="2514" from-port="2" to-layer="2523" to-port="0" /> + <edge from-layer="2515" from-port="0" to-layer="2516" to-port="0" /> + <edge from-layer="2516" from-port="1" to-layer="2519" to-port="0" /> + <edge from-layer="2517" from-port="0" to-layer="2518" to-port="0" /> + <edge from-layer="2518" from-port="1" to-layer="2519" to-port="1" /> + <edge from-layer="2519" from-port="2" to-layer="2521" to-port="0" /> + <edge from-layer="2520" from-port="0" to-layer="2521" to-port="1" /> + <edge from-layer="2521" from-port="2" to-layer="2522" to-port="0" /> + <edge from-layer="2522" from-port="1" to-layer="2523" to-port="1" /> + <edge from-layer="2523" from-port="2" to-layer="2525" to-port="0" /> + <edge from-layer="2524" from-port="0" to-layer="2525" to-port="1" /> + <edge from-layer="2525" from-port="2" to-layer="2526" to-port="0" /> + <edge from-layer="2526" from-port="2" to-layer="2556" to-port="1" /> + <edge from-layer="2526" from-port="2" to-layer="2528" to-port="0" /> + <edge from-layer="2527" from-port="0" to-layer="2528" to-port="1" /> + <edge from-layer="2528" from-port="2" to-layer="2530" to-port="0" /> + <edge from-layer="2529" from-port="0" to-layer="2530" to-port="1" /> + <edge from-layer="2530" from-port="2" to-layer="2532" to-port="0" /> + <edge from-layer="2531" from-port="0" to-layer="2532" to-port="1" /> + <edge from-layer="2532" from-port="2" to-layer="2541" to-port="0" /> + <edge from-layer="2533" from-port="0" to-layer="2534" to-port="0" /> + <edge from-layer="2534" from-port="1" to-layer="2537" to-port="0" /> + <edge from-layer="2535" from-port="0" to-layer="2536" to-port="0" /> + <edge from-layer="2536" from-port="1" to-layer="2537" to-port="1" /> + <edge from-layer="2537" from-port="2" to-layer="2539" to-port="0" /> + <edge from-layer="2538" from-port="0" to-layer="2539" to-port="1" /> + <edge from-layer="2539" from-port="2" to-layer="2540" to-port="0" /> + <edge from-layer="2540" from-port="1" to-layer="2541" to-port="1" /> + <edge from-layer="2541" from-port="2" to-layer="2543" to-port="0" /> + <edge from-layer="2542" from-port="0" to-layer="2543" to-port="1" /> + <edge from-layer="2543" from-port="2" to-layer="2544" to-port="0" /> + <edge from-layer="2544" from-port="1" to-layer="2553" to-port="0" /> + <edge from-layer="2545" from-port="0" to-layer="2546" to-port="0" /> + <edge from-layer="2546" from-port="1" to-layer="2549" to-port="0" /> + <edge from-layer="2547" from-port="0" to-layer="2548" to-port="0" /> + <edge from-layer="2548" from-port="1" to-layer="2549" to-port="1" /> + <edge from-layer="2549" from-port="2" to-layer="2551" to-port="0" /> + <edge from-layer="2550" from-port="0" to-layer="2551" to-port="1" /> + <edge from-layer="2551" from-port="2" to-layer="2552" to-port="0" /> + <edge from-layer="2552" from-port="1" to-layer="2553" to-port="1" /> + <edge from-layer="2553" from-port="2" to-layer="2555" to-port="0" /> + <edge from-layer="2554" from-port="0" to-layer="2555" to-port="1" /> + <edge from-layer="2555" from-port="2" to-layer="2556" to-port="0" /> + <edge from-layer="2556" from-port="2" to-layer="2558" to-port="0" /> + <edge from-layer="2556" from-port="2" to-layer="2753" to-port="1" /> + <edge from-layer="2557" from-port="0" to-layer="2558" to-port="1" /> + <edge from-layer="2558" from-port="2" to-layer="2560" to-port="0" /> + <edge from-layer="2559" from-port="0" to-layer="2560" to-port="1" /> + <edge from-layer="2560" from-port="2" to-layer="2562" to-port="0" /> + <edge from-layer="2561" from-port="0" to-layer="2562" to-port="1" /> + <edge from-layer="2562" from-port="2" to-layer="2571" to-port="0" /> + <edge from-layer="2563" from-port="0" to-layer="2564" to-port="0" /> + <edge from-layer="2564" from-port="1" to-layer="2567" to-port="0" /> + <edge from-layer="2565" from-port="0" to-layer="2566" to-port="0" /> + <edge from-layer="2566" from-port="1" to-layer="2567" to-port="1" /> + <edge from-layer="2567" from-port="2" to-layer="2569" to-port="0" /> + <edge from-layer="2568" from-port="0" to-layer="2569" to-port="1" /> + <edge from-layer="2569" from-port="2" to-layer="2570" to-port="0" /> + <edge from-layer="2570" from-port="1" to-layer="2571" to-port="1" /> + <edge from-layer="2571" from-port="2" to-layer="2573" to-port="0" /> + <edge from-layer="2572" from-port="0" to-layer="2573" to-port="1" /> + <edge from-layer="2573" from-port="2" to-layer="2575" to-port="0" /> + <edge from-layer="2574" from-port="0" to-layer="2575" to-port="1" /> + <edge from-layer="2575" from-port="2" to-layer="2689" to-port="0" /> + <edge from-layer="2575" from-port="2" to-layer="2579" to-port="0" /> + <edge from-layer="2575" from-port="2" to-layer="2591" to-port="0" /> + <edge from-layer="2576" from-port="0" to-layer="2579" to-port="1" /> + <edge from-layer="2577" from-port="0" to-layer="2579" to-port="2" /> + <edge from-layer="2578" from-port="0" to-layer="2579" to-port="3" /> + <edge from-layer="2579" from-port="4" to-layer="2581" to-port="0" /> + <edge from-layer="2580" from-port="0" to-layer="2581" to-port="1" /> + <edge from-layer="2581" from-port="2" to-layer="2585" to-port="0" /> + <edge from-layer="2582" from-port="0" to-layer="2585" to-port="1" /> + <edge from-layer="2583" from-port="0" to-layer="2585" to-port="2" /> + <edge from-layer="2584" from-port="0" to-layer="2585" to-port="3" /> + <edge from-layer="2585" from-port="4" to-layer="2636" to-port="0" /> + <edge from-layer="2585" from-port="4" to-layer="2620" to-port="0" /> + <edge from-layer="2585" from-port="4" to-layer="2631" to-port="0" /> + <edge from-layer="2585" from-port="4" to-layer="2617" to-port="0" /> + <edge from-layer="2586" from-port="0" to-layer="2613" to-port="0" /> + <edge from-layer="2587" from-port="0" to-layer="2613" to-port="1" /> + <edge from-layer="2588" from-port="0" to-layer="2591" to-port="1" /> + <edge from-layer="2589" from-port="0" to-layer="2591" to-port="2" /> + <edge from-layer="2590" from-port="0" to-layer="2591" to-port="3" /> + <edge from-layer="2591" from-port="4" to-layer="2592" to-port="0" /> + <edge from-layer="2591" from-port="4" to-layer="2648" to-port="0" /> + <edge from-layer="2592" from-port="1" to-layer="2595" to-port="0" /> + <edge from-layer="2593" from-port="0" to-layer="2595" to-port="1" /> + <edge from-layer="2594" from-port="0" to-layer="2595" to-port="2" /> + <edge from-layer="2595" from-port="3" to-layer="2611" to-port="0" /> + <edge from-layer="2596" from-port="0" to-layer="2601" to-port="0" /> + <edge from-layer="2597" from-port="0" to-layer="2600" to-port="1" /> + <edge from-layer="2598" from-port="0" to-layer="2600" to-port="2" /> + <edge from-layer="2599" from-port="0" to-layer="2600" to-port="3" /> + <edge from-layer="2600" from-port="4" to-layer="2601" to-port="1" /> + <edge from-layer="2601" from-port="2" to-layer="2602" to-port="0" /> + <edge from-layer="2602" from-port="1" to-layer="2604" to-port="0" /> + <edge from-layer="2603" from-port="0" to-layer="2604" to-port="2" /> + <edge from-layer="2604" from-port="3" to-layer="2676" to-port="0" /> + <edge from-layer="2604" from-port="3" to-layer="2605" to-port="0" /> + <edge from-layer="2605" from-port="1" to-layer="2608" to-port="0" /> + <edge from-layer="2606" from-port="0" to-layer="2608" to-port="1" /> + <edge from-layer="2607" from-port="0" to-layer="2608" to-port="2" /> + <edge from-layer="2608" from-port="3" to-layer="2700" to-port="0" /> + <edge from-layer="2608" from-port="3" to-layer="2610" to-port="0" /> + <edge from-layer="2609" from-port="0" to-layer="2610" to-port="1" /> + <edge from-layer="2610" from-port="2" to-layer="2611" to-port="1" /> + <edge from-layer="2611" from-port="2" to-layer="2641" to-port="2" /> + <edge from-layer="2611" from-port="2" to-layer="2613" to-port="2" /> + <edge from-layer="2612" from-port="0" to-layer="2613" to-port="3" /> + <edge from-layer="2613" from-port="4" to-layer="2615" to-port="0" /> + <edge from-layer="2614" from-port="0" to-layer="2615" to-port="2" /> + <edge from-layer="2615" from-port="3" to-layer="2616" to-port="0" /> + <edge from-layer="2616" from-port="2" to-layer="2617" to-port="1" /> + <edge from-layer="2616" from-port="2" to-layer="2653" to-port="1" /> + <edge from-layer="2617" from-port="2" to-layer="2646" to-port="0" /> + <edge from-layer="2618" from-port="0" to-layer="2628" to-port="0" /> + <edge from-layer="2619" from-port="0" to-layer="2628" to-port="1" /> + <edge from-layer="2620" from-port="1" to-layer="2622" to-port="0" /> + <edge from-layer="2621" from-port="0" to-layer="2622" to-port="2" /> + <edge from-layer="2622" from-port="3" to-layer="2623" to-port="0" /> + <edge from-layer="2623" from-port="2" to-layer="2624" to-port="0" /> + <edge from-layer="2624" from-port="1" to-layer="2626" to-port="0" /> + <edge from-layer="2625" from-port="0" to-layer="2626" to-port="1" /> + <edge from-layer="2626" from-port="2" to-layer="2628" to-port="2" /> + <edge from-layer="2627" from-port="0" to-layer="2628" to-port="3" /> + <edge from-layer="2628" from-port="4" to-layer="2631" to-port="1" /> + <edge from-layer="2628" from-port="4" to-layer="2636" to-port="2" /> + <edge from-layer="2629" from-port="0" to-layer="2631" to-port="2" /> + <edge from-layer="2630" from-port="0" to-layer="2631" to-port="3" /> + <edge from-layer="2631" from-port="4" to-layer="2633" to-port="0" /> + <edge from-layer="2632" from-port="0" to-layer="2633" to-port="1" /> + <edge from-layer="2633" from-port="2" to-layer="2637" to-port="0" /> + <edge from-layer="2634" from-port="0" to-layer="2636" to-port="1" /> + <edge from-layer="2635" from-port="0" to-layer="2636" to-port="3" /> + <edge from-layer="2636" from-port="4" to-layer="2637" to-port="1" /> + <edge from-layer="2637" from-port="2" to-layer="2645" to-port="0" /> + <edge from-layer="2638" from-port="0" to-layer="2641" to-port="0" /> + <edge from-layer="2639" from-port="0" to-layer="2641" to-port="1" /> + <edge from-layer="2640" from-port="0" to-layer="2641" to-port="3" /> + <edge from-layer="2641" from-port="4" to-layer="2643" to-port="0" /> + <edge from-layer="2642" from-port="0" to-layer="2643" to-port="2" /> + <edge from-layer="2643" from-port="3" to-layer="2644" to-port="0" /> + <edge from-layer="2644" from-port="2" to-layer="2645" to-port="1" /> + <edge from-layer="2644" from-port="2" to-layer="2674" to-port="1" /> + <edge from-layer="2645" from-port="2" to-layer="2646" to-port="1" /> + <edge from-layer="2646" from-port="2" to-layer="2737" to-port="0" /> + <edge from-layer="2646" from-port="2" to-layer="2701" to-port="0" /> + <edge from-layer="2647" from-port="0" to-layer="2648" to-port="1" /> + <edge from-layer="2648" from-port="2" to-layer="2652" to-port="0" /> + <edge from-layer="2649" from-port="0" to-layer="2652" to-port="1" /> + <edge from-layer="2650" from-port="0" to-layer="2652" to-port="2" /> + <edge from-layer="2651" from-port="0" to-layer="2652" to-port="3" /> + <edge from-layer="2652" from-port="4" to-layer="2672" to-port="0" /> + <edge from-layer="2652" from-port="4" to-layer="2667" to-port="0" /> + <edge from-layer="2652" from-port="4" to-layer="2656" to-port="0" /> + <edge from-layer="2652" from-port="4" to-layer="2653" to-port="0" /> + <edge from-layer="2653" from-port="2" to-layer="2675" to-port="0" /> + <edge from-layer="2654" from-port="0" to-layer="2664" to-port="0" /> + <edge from-layer="2655" from-port="0" to-layer="2664" to-port="1" /> + <edge from-layer="2656" from-port="1" to-layer="2658" to-port="0" /> + <edge from-layer="2657" from-port="0" to-layer="2658" to-port="2" /> + <edge from-layer="2658" from-port="3" to-layer="2659" to-port="0" /> + <edge from-layer="2659" from-port="2" to-layer="2660" to-port="0" /> + <edge from-layer="2660" from-port="1" to-layer="2662" to-port="0" /> + <edge from-layer="2661" from-port="0" to-layer="2662" to-port="1" /> + <edge from-layer="2662" from-port="2" to-layer="2664" to-port="2" /> + <edge from-layer="2663" from-port="0" to-layer="2664" to-port="3" /> + <edge from-layer="2664" from-port="4" to-layer="2667" to-port="1" /> + <edge from-layer="2664" from-port="4" to-layer="2672" to-port="2" /> + <edge from-layer="2665" from-port="0" to-layer="2667" to-port="2" /> + <edge from-layer="2666" from-port="0" to-layer="2667" to-port="3" /> + <edge from-layer="2667" from-port="4" to-layer="2669" to-port="0" /> + <edge from-layer="2668" from-port="0" to-layer="2669" to-port="1" /> + <edge from-layer="2669" from-port="2" to-layer="2673" to-port="0" /> + <edge from-layer="2670" from-port="0" to-layer="2672" to-port="1" /> + <edge from-layer="2671" from-port="0" to-layer="2672" to-port="3" /> + <edge from-layer="2672" from-port="4" to-layer="2673" to-port="1" /> + <edge from-layer="2673" from-port="2" to-layer="2674" to-port="0" /> + <edge from-layer="2674" from-port="2" to-layer="2675" to-port="1" /> + <edge from-layer="2675" from-port="2" to-layer="2696" to-port="0" /> + <edge from-layer="2675" from-port="2" to-layer="2676" to-port="1" /> + <edge from-layer="2676" from-port="2" to-layer="2737" to-port="1" /> + <edge from-layer="2676" from-port="2" to-layer="7234" to-port="0" /> + <edge from-layer="2677" from-port="0" to-layer="2682" to-port="0" /> + <edge from-layer="2678" from-port="0" to-layer="2681" to-port="1" /> + <edge from-layer="2679" from-port="0" to-layer="2681" to-port="2" /> + <edge from-layer="2680" from-port="0" to-layer="2681" to-port="3" /> + <edge from-layer="2681" from-port="4" to-layer="2682" to-port="1" /> + <edge from-layer="2682" from-port="2" to-layer="2683" to-port="0" /> + <edge from-layer="2683" from-port="1" to-layer="2685" to-port="0" /> + <edge from-layer="2684" from-port="0" to-layer="2685" to-port="2" /> + <edge from-layer="2685" from-port="3" to-layer="2692" to-port="0" /> + <edge from-layer="2686" from-port="0" to-layer="2689" to-port="1" /> + <edge from-layer="2687" from-port="0" to-layer="2689" to-port="2" /> + <edge from-layer="2688" from-port="0" to-layer="2689" to-port="3" /> + <edge from-layer="2689" from-port="4" to-layer="2691" to-port="0" /> + <edge from-layer="2690" from-port="0" to-layer="2691" to-port="1" /> + <edge from-layer="2691" from-port="2" to-layer="2692" to-port="1" /> + <edge from-layer="2692" from-port="2" to-layer="7233" to-port="0" /> + <edge from-layer="2692" from-port="2" to-layer="2737" to-port="2" /> + <edge from-layer="2693" from-port="0" to-layer="2715" to-port="0" /> + <edge from-layer="2694" from-port="0" to-layer="2709" to-port="0" /> + <edge from-layer="2695" from-port="0" to-layer="2709" to-port="1" /> + <edge from-layer="2695" from-port="0" to-layer="2713" to-port="1" /> + <edge from-layer="2696" from-port="1" to-layer="2699" to-port="0" /> + <edge from-layer="2697" from-port="0" to-layer="2699" to-port="1" /> + <edge from-layer="2698" from-port="0" to-layer="2699" to-port="2" /> + <edge from-layer="2699" from-port="3" to-layer="2700" to-port="1" /> + <edge from-layer="2700" from-port="2" to-layer="2705" to-port="0" /> + <edge from-layer="2700" from-port="2" to-layer="2712" to-port="0" /> + <edge from-layer="2701" from-port="1" to-layer="2704" to-port="0" /> + <edge from-layer="2701" from-port="1" to-layer="2730" to-port="0" /> + <edge from-layer="2702" from-port="0" to-layer="2704" to-port="1" /> + <edge from-layer="2703" from-port="0" to-layer="2704" to-port="2" /> + <edge from-layer="2704" from-port="3" to-layer="2705" to-port="1" /> + <edge from-layer="2705" from-port="2" to-layer="2707" to-port="0" /> + <edge from-layer="2706" from-port="0" to-layer="2707" to-port="1" /> + <edge from-layer="2707" from-port="2" to-layer="2709" to-port="2" /> + <edge from-layer="2708" from-port="0" to-layer="2709" to-port="3" /> + <edge from-layer="2708" from-port="0" to-layer="2713" to-port="3" /> + <edge from-layer="2709" from-port="4" to-layer="2715" to-port="1" /> + <edge from-layer="2710" from-port="0" to-layer="2713" to-port="0" /> + <edge from-layer="2711" from-port="0" to-layer="2712" to-port="1" /> + <edge from-layer="2712" from-port="2" to-layer="2713" to-port="2" /> + <edge from-layer="2712" from-port="2" to-layer="2720" to-port="2" /> + <edge from-layer="2713" from-port="4" to-layer="2715" to-port="2" /> + <edge from-layer="2714" from-port="0" to-layer="2715" to-port="3" /> + <edge from-layer="2715" from-port="4" to-layer="2722" to-port="0" /> + <edge from-layer="2716" from-port="0" to-layer="2722" to-port="1" /> + <edge from-layer="2717" from-port="0" to-layer="2720" to-port="0" /> + <edge from-layer="2718" from-port="0" to-layer="2720" to-port="1" /> + <edge from-layer="2719" from-port="0" to-layer="2720" to-port="3" /> + <edge from-layer="2720" from-port="4" to-layer="2722" to-port="2" /> + <edge from-layer="2721" from-port="0" to-layer="2722" to-port="3" /> + <edge from-layer="2722" from-port="4" to-layer="2725" to-port="0" /> + <edge from-layer="2723" from-port="0" to-layer="2725" to-port="1" /> + <edge from-layer="2724" from-port="0" to-layer="2725" to-port="2" /> + <edge from-layer="2725" from-port="3" to-layer="2726" to-port="0" /> + <edge from-layer="2726" from-port="2" to-layer="2727" to-port="0" /> + <edge from-layer="2726" from-port="2" to-layer="2736" to-port="0" /> + <edge from-layer="2727" from-port="1" to-layer="2735" to-port="0" /> + <edge from-layer="2728" from-port="0" to-layer="2730" to-port="1" /> + <edge from-layer="2729" from-port="0" to-layer="2730" to-port="2" /> + <edge from-layer="2730" from-port="3" to-layer="2734" to-port="0" /> + <edge from-layer="2731" from-port="0" to-layer="2734" to-port="1" /> + <edge from-layer="2732" from-port="0" to-layer="2734" to-port="2" /> + <edge from-layer="2733" from-port="0" to-layer="2734" to-port="3" /> + <edge from-layer="2734" from-port="4" to-layer="2735" to-port="1" /> + <edge from-layer="2735" from-port="2" to-layer="2736" to-port="1" /> + <edge from-layer="2736" from-port="2" to-layer="2737" to-port="3" /> + <edge from-layer="2737" from-port="4" to-layer="2739" to-port="0" /> + <edge from-layer="2738" from-port="0" to-layer="2739" to-port="1" /> + <edge from-layer="2739" from-port="2" to-layer="2741" to-port="0" /> + <edge from-layer="2740" from-port="0" to-layer="2741" to-port="1" /> + <edge from-layer="2741" from-port="2" to-layer="2750" to-port="0" /> + <edge from-layer="2742" from-port="0" to-layer="2743" to-port="0" /> + <edge from-layer="2743" from-port="1" to-layer="2746" to-port="0" /> + <edge from-layer="2744" from-port="0" to-layer="2745" to-port="0" /> + <edge from-layer="2745" from-port="1" to-layer="2746" to-port="1" /> + <edge from-layer="2746" from-port="2" to-layer="2748" to-port="0" /> + <edge from-layer="2747" from-port="0" to-layer="2748" to-port="1" /> + <edge from-layer="2748" from-port="2" to-layer="2749" to-port="0" /> + <edge from-layer="2749" from-port="1" to-layer="2750" to-port="1" /> + <edge from-layer="2750" from-port="2" to-layer="2752" to-port="0" /> + <edge from-layer="2751" from-port="0" to-layer="2752" to-port="1" /> + <edge from-layer="2752" from-port="2" to-layer="2753" to-port="0" /> + <edge from-layer="2753" from-port="2" to-layer="2783" to-port="1" /> + <edge from-layer="2753" from-port="2" to-layer="2755" to-port="0" /> + <edge from-layer="2754" from-port="0" to-layer="2755" to-port="1" /> + <edge from-layer="2755" from-port="2" to-layer="2757" to-port="0" /> + <edge from-layer="2756" from-port="0" to-layer="2757" to-port="1" /> + <edge from-layer="2757" from-port="2" to-layer="2759" to-port="0" /> + <edge from-layer="2758" from-port="0" to-layer="2759" to-port="1" /> + <edge from-layer="2759" from-port="2" to-layer="2768" to-port="0" /> + <edge from-layer="2760" from-port="0" to-layer="2761" to-port="0" /> + <edge from-layer="2761" from-port="1" to-layer="2764" to-port="0" /> + <edge from-layer="2762" from-port="0" to-layer="2763" to-port="0" /> + <edge from-layer="2763" from-port="1" to-layer="2764" to-port="1" /> + <edge from-layer="2764" from-port="2" to-layer="2766" to-port="0" /> + <edge from-layer="2765" from-port="0" to-layer="2766" to-port="1" /> + <edge from-layer="2766" from-port="2" to-layer="2767" to-port="0" /> + <edge from-layer="2767" from-port="1" to-layer="2768" to-port="1" /> + <edge from-layer="2768" from-port="2" to-layer="2770" to-port="0" /> + <edge from-layer="2769" from-port="0" to-layer="2770" to-port="1" /> + <edge from-layer="2770" from-port="2" to-layer="2771" to-port="0" /> + <edge from-layer="2771" from-port="1" to-layer="2780" to-port="0" /> + <edge from-layer="2772" from-port="0" to-layer="2773" to-port="0" /> + <edge from-layer="2773" from-port="1" to-layer="2776" to-port="0" /> + <edge from-layer="2774" from-port="0" to-layer="2775" to-port="0" /> + <edge from-layer="2775" from-port="1" to-layer="2776" to-port="1" /> + <edge from-layer="2776" from-port="2" to-layer="2778" to-port="0" /> + <edge from-layer="2777" from-port="0" to-layer="2778" to-port="1" /> + <edge from-layer="2778" from-port="2" to-layer="2779" to-port="0" /> + <edge from-layer="2779" from-port="1" to-layer="2780" to-port="1" /> + <edge from-layer="2780" from-port="2" to-layer="2782" to-port="0" /> + <edge from-layer="2781" from-port="0" to-layer="2782" to-port="1" /> + <edge from-layer="2782" from-port="2" to-layer="2783" to-port="0" /> + <edge from-layer="2783" from-port="2" to-layer="2785" to-port="0" /> + <edge from-layer="2783" from-port="2" to-layer="2980" to-port="1" /> + <edge from-layer="2784" from-port="0" to-layer="2785" to-port="1" /> + <edge from-layer="2785" from-port="2" to-layer="2787" to-port="0" /> + <edge from-layer="2786" from-port="0" to-layer="2787" to-port="1" /> + <edge from-layer="2787" from-port="2" to-layer="2789" to-port="0" /> + <edge from-layer="2788" from-port="0" to-layer="2789" to-port="1" /> + <edge from-layer="2789" from-port="2" to-layer="2798" to-port="0" /> + <edge from-layer="2790" from-port="0" to-layer="2791" to-port="0" /> + <edge from-layer="2791" from-port="1" to-layer="2794" to-port="0" /> + <edge from-layer="2792" from-port="0" to-layer="2793" to-port="0" /> + <edge from-layer="2793" from-port="1" to-layer="2794" to-port="1" /> + <edge from-layer="2794" from-port="2" to-layer="2796" to-port="0" /> + <edge from-layer="2795" from-port="0" to-layer="2796" to-port="1" /> + <edge from-layer="2796" from-port="2" to-layer="2797" to-port="0" /> + <edge from-layer="2797" from-port="1" to-layer="2798" to-port="1" /> + <edge from-layer="2798" from-port="2" to-layer="2800" to-port="0" /> + <edge from-layer="2799" from-port="0" to-layer="2800" to-port="1" /> + <edge from-layer="2800" from-port="2" to-layer="2802" to-port="0" /> + <edge from-layer="2801" from-port="0" to-layer="2802" to-port="1" /> + <edge from-layer="2802" from-port="2" to-layer="2916" to-port="0" /> + <edge from-layer="2802" from-port="2" to-layer="2806" to-port="0" /> + <edge from-layer="2802" from-port="2" to-layer="2818" to-port="0" /> + <edge from-layer="2803" from-port="0" to-layer="2806" to-port="1" /> + <edge from-layer="2804" from-port="0" to-layer="2806" to-port="2" /> + <edge from-layer="2805" from-port="0" to-layer="2806" to-port="3" /> + <edge from-layer="2806" from-port="4" to-layer="2808" to-port="0" /> + <edge from-layer="2807" from-port="0" to-layer="2808" to-port="1" /> + <edge from-layer="2808" from-port="2" to-layer="2812" to-port="0" /> + <edge from-layer="2809" from-port="0" to-layer="2812" to-port="1" /> + <edge from-layer="2810" from-port="0" to-layer="2812" to-port="2" /> + <edge from-layer="2811" from-port="0" to-layer="2812" to-port="3" /> + <edge from-layer="2812" from-port="4" to-layer="2863" to-port="0" /> + <edge from-layer="2812" from-port="4" to-layer="2858" to-port="0" /> + <edge from-layer="2812" from-port="4" to-layer="2847" to-port="0" /> + <edge from-layer="2812" from-port="4" to-layer="2844" to-port="0" /> + <edge from-layer="2813" from-port="0" to-layer="2840" to-port="0" /> + <edge from-layer="2814" from-port="0" to-layer="2840" to-port="1" /> + <edge from-layer="2815" from-port="0" to-layer="2818" to-port="1" /> + <edge from-layer="2816" from-port="0" to-layer="2818" to-port="2" /> + <edge from-layer="2817" from-port="0" to-layer="2818" to-port="3" /> + <edge from-layer="2818" from-port="4" to-layer="2875" to-port="0" /> + <edge from-layer="2818" from-port="4" to-layer="2819" to-port="0" /> + <edge from-layer="2819" from-port="1" to-layer="2822" to-port="0" /> + <edge from-layer="2820" from-port="0" to-layer="2822" to-port="1" /> + <edge from-layer="2821" from-port="0" to-layer="2822" to-port="2" /> + <edge from-layer="2822" from-port="3" to-layer="2838" to-port="0" /> + <edge from-layer="2823" from-port="0" to-layer="2828" to-port="0" /> + <edge from-layer="2824" from-port="0" to-layer="2827" to-port="1" /> + <edge from-layer="2825" from-port="0" to-layer="2827" to-port="2" /> + <edge from-layer="2826" from-port="0" to-layer="2827" to-port="3" /> + <edge from-layer="2827" from-port="4" to-layer="2828" to-port="1" /> + <edge from-layer="2828" from-port="2" to-layer="2829" to-port="0" /> + <edge from-layer="2829" from-port="1" to-layer="2831" to-port="0" /> + <edge from-layer="2830" from-port="0" to-layer="2831" to-port="2" /> + <edge from-layer="2831" from-port="3" to-layer="2903" to-port="0" /> + <edge from-layer="2831" from-port="3" to-layer="2832" to-port="0" /> + <edge from-layer="2832" from-port="1" to-layer="2835" to-port="0" /> + <edge from-layer="2833" from-port="0" to-layer="2835" to-port="1" /> + <edge from-layer="2834" from-port="0" to-layer="2835" to-port="2" /> + <edge from-layer="2835" from-port="3" to-layer="2837" to-port="0" /> + <edge from-layer="2835" from-port="3" to-layer="2927" to-port="0" /> + <edge from-layer="2836" from-port="0" to-layer="2837" to-port="1" /> + <edge from-layer="2837" from-port="2" to-layer="2838" to-port="1" /> + <edge from-layer="2838" from-port="2" to-layer="2868" to-port="2" /> + <edge from-layer="2838" from-port="2" to-layer="2840" to-port="2" /> + <edge from-layer="2839" from-port="0" to-layer="2840" to-port="3" /> + <edge from-layer="2840" from-port="4" to-layer="2842" to-port="0" /> + <edge from-layer="2841" from-port="0" to-layer="2842" to-port="2" /> + <edge from-layer="2842" from-port="3" to-layer="2843" to-port="0" /> + <edge from-layer="2843" from-port="2" to-layer="2844" to-port="1" /> + <edge from-layer="2843" from-port="2" to-layer="2880" to-port="1" /> + <edge from-layer="2844" from-port="2" to-layer="2873" to-port="0" /> + <edge from-layer="2845" from-port="0" to-layer="2855" to-port="0" /> + <edge from-layer="2846" from-port="0" to-layer="2855" to-port="1" /> + <edge from-layer="2847" from-port="1" to-layer="2849" to-port="0" /> + <edge from-layer="2848" from-port="0" to-layer="2849" to-port="2" /> + <edge from-layer="2849" from-port="3" to-layer="2850" to-port="0" /> + <edge from-layer="2850" from-port="2" to-layer="2851" to-port="0" /> + <edge from-layer="2851" from-port="1" to-layer="2853" to-port="0" /> + <edge from-layer="2852" from-port="0" to-layer="2853" to-port="1" /> + <edge from-layer="2853" from-port="2" to-layer="2855" to-port="2" /> + <edge from-layer="2854" from-port="0" to-layer="2855" to-port="3" /> + <edge from-layer="2855" from-port="4" to-layer="2858" to-port="1" /> + <edge from-layer="2855" from-port="4" to-layer="2863" to-port="2" /> + <edge from-layer="2856" from-port="0" to-layer="2858" to-port="2" /> + <edge from-layer="2857" from-port="0" to-layer="2858" to-port="3" /> + <edge from-layer="2858" from-port="4" to-layer="2860" to-port="0" /> + <edge from-layer="2859" from-port="0" to-layer="2860" to-port="1" /> + <edge from-layer="2860" from-port="2" to-layer="2864" to-port="0" /> + <edge from-layer="2861" from-port="0" to-layer="2863" to-port="1" /> + <edge from-layer="2862" from-port="0" to-layer="2863" to-port="3" /> + <edge from-layer="2863" from-port="4" to-layer="2864" to-port="1" /> + <edge from-layer="2864" from-port="2" to-layer="2872" to-port="0" /> + <edge from-layer="2865" from-port="0" to-layer="2868" to-port="0" /> + <edge from-layer="2866" from-port="0" to-layer="2868" to-port="1" /> + <edge from-layer="2867" from-port="0" to-layer="2868" to-port="3" /> + <edge from-layer="2868" from-port="4" to-layer="2870" to-port="0" /> + <edge from-layer="2869" from-port="0" to-layer="2870" to-port="2" /> + <edge from-layer="2870" from-port="3" to-layer="2871" to-port="0" /> + <edge from-layer="2871" from-port="2" to-layer="2872" to-port="1" /> + <edge from-layer="2871" from-port="2" to-layer="2901" to-port="1" /> + <edge from-layer="2872" from-port="2" to-layer="2873" to-port="1" /> + <edge from-layer="2873" from-port="2" to-layer="2928" to-port="0" /> + <edge from-layer="2873" from-port="2" to-layer="2964" to-port="0" /> + <edge from-layer="2874" from-port="0" to-layer="2875" to-port="1" /> + <edge from-layer="2875" from-port="2" to-layer="2879" to-port="0" /> + <edge from-layer="2876" from-port="0" to-layer="2879" to-port="1" /> + <edge from-layer="2877" from-port="0" to-layer="2879" to-port="2" /> + <edge from-layer="2878" from-port="0" to-layer="2879" to-port="3" /> + <edge from-layer="2879" from-port="4" to-layer="2880" to-port="0" /> + <edge from-layer="2879" from-port="4" to-layer="2883" to-port="0" /> + <edge from-layer="2879" from-port="4" to-layer="2894" to-port="0" /> + <edge from-layer="2879" from-port="4" to-layer="2899" to-port="0" /> + <edge from-layer="2880" from-port="2" to-layer="2902" to-port="0" /> + <edge from-layer="2881" from-port="0" to-layer="2891" to-port="0" /> + <edge from-layer="2882" from-port="0" to-layer="2891" to-port="1" /> + <edge from-layer="2883" from-port="1" to-layer="2885" to-port="0" /> + <edge from-layer="2884" from-port="0" to-layer="2885" to-port="2" /> + <edge from-layer="2885" from-port="3" to-layer="2886" to-port="0" /> + <edge from-layer="2886" from-port="2" to-layer="2887" to-port="0" /> + <edge from-layer="2887" from-port="1" to-layer="2889" to-port="0" /> + <edge from-layer="2888" from-port="0" to-layer="2889" to-port="1" /> + <edge from-layer="2889" from-port="2" to-layer="2891" to-port="2" /> + <edge from-layer="2890" from-port="0" to-layer="2891" to-port="3" /> + <edge from-layer="2891" from-port="4" to-layer="2894" to-port="1" /> + <edge from-layer="2891" from-port="4" to-layer="2899" to-port="2" /> + <edge from-layer="2892" from-port="0" to-layer="2894" to-port="2" /> + <edge from-layer="2893" from-port="0" to-layer="2894" to-port="3" /> + <edge from-layer="2894" from-port="4" to-layer="2896" to-port="0" /> + <edge from-layer="2895" from-port="0" to-layer="2896" to-port="1" /> + <edge from-layer="2896" from-port="2" to-layer="2900" to-port="0" /> + <edge from-layer="2897" from-port="0" to-layer="2899" to-port="1" /> + <edge from-layer="2898" from-port="0" to-layer="2899" to-port="3" /> + <edge from-layer="2899" from-port="4" to-layer="2900" to-port="1" /> + <edge from-layer="2900" from-port="2" to-layer="2901" to-port="0" /> + <edge from-layer="2901" from-port="2" to-layer="2902" to-port="1" /> + <edge from-layer="2902" from-port="2" to-layer="2903" to-port="1" /> + <edge from-layer="2902" from-port="2" to-layer="2923" to-port="0" /> + <edge from-layer="2903" from-port="2" to-layer="2964" to-port="1" /> + <edge from-layer="2903" from-port="2" to-layer="7232" to-port="0" /> + <edge from-layer="2904" from-port="0" to-layer="2909" to-port="0" /> + <edge from-layer="2905" from-port="0" to-layer="2908" to-port="1" /> + <edge from-layer="2906" from-port="0" to-layer="2908" to-port="2" /> + <edge from-layer="2907" from-port="0" to-layer="2908" to-port="3" /> + <edge from-layer="2908" from-port="4" to-layer="2909" to-port="1" /> + <edge from-layer="2909" from-port="2" to-layer="2910" to-port="0" /> + <edge from-layer="2910" from-port="1" to-layer="2912" to-port="0" /> + <edge from-layer="2911" from-port="0" to-layer="2912" to-port="2" /> + <edge from-layer="2912" from-port="3" to-layer="2919" to-port="0" /> + <edge from-layer="2913" from-port="0" to-layer="2916" to-port="1" /> + <edge from-layer="2914" from-port="0" to-layer="2916" to-port="2" /> + <edge from-layer="2915" from-port="0" to-layer="2916" to-port="3" /> + <edge from-layer="2916" from-port="4" to-layer="2918" to-port="0" /> + <edge from-layer="2917" from-port="0" to-layer="2918" to-port="1" /> + <edge from-layer="2918" from-port="2" to-layer="2919" to-port="1" /> + <edge from-layer="2919" from-port="2" to-layer="7231" to-port="0" /> + <edge from-layer="2919" from-port="2" to-layer="2964" to-port="2" /> + <edge from-layer="2920" from-port="0" to-layer="2942" to-port="0" /> + <edge from-layer="2921" from-port="0" to-layer="2936" to-port="0" /> + <edge from-layer="2922" from-port="0" to-layer="2940" to-port="1" /> + <edge from-layer="2922" from-port="0" to-layer="2936" to-port="1" /> + <edge from-layer="2923" from-port="1" to-layer="2926" to-port="0" /> + <edge from-layer="2924" from-port="0" to-layer="2926" to-port="1" /> + <edge from-layer="2925" from-port="0" to-layer="2926" to-port="2" /> + <edge from-layer="2926" from-port="3" to-layer="2927" to-port="1" /> + <edge from-layer="2927" from-port="2" to-layer="2932" to-port="0" /> + <edge from-layer="2927" from-port="2" to-layer="2939" to-port="0" /> + <edge from-layer="2928" from-port="1" to-layer="2957" to-port="0" /> + <edge from-layer="2928" from-port="1" to-layer="2931" to-port="0" /> + <edge from-layer="2929" from-port="0" to-layer="2931" to-port="1" /> + <edge from-layer="2930" from-port="0" to-layer="2931" to-port="2" /> + <edge from-layer="2931" from-port="3" to-layer="2932" to-port="1" /> + <edge from-layer="2932" from-port="2" to-layer="2934" to-port="0" /> + <edge from-layer="2933" from-port="0" to-layer="2934" to-port="1" /> + <edge from-layer="2934" from-port="2" to-layer="2936" to-port="2" /> + <edge from-layer="2935" from-port="0" to-layer="2936" to-port="3" /> + <edge from-layer="2935" from-port="0" to-layer="2940" to-port="3" /> + <edge from-layer="2936" from-port="4" to-layer="2942" to-port="1" /> + <edge from-layer="2937" from-port="0" to-layer="2940" to-port="0" /> + <edge from-layer="2938" from-port="0" to-layer="2939" to-port="1" /> + <edge from-layer="2939" from-port="2" to-layer="2947" to-port="2" /> + <edge from-layer="2939" from-port="2" to-layer="2940" to-port="2" /> + <edge from-layer="2940" from-port="4" to-layer="2942" to-port="2" /> + <edge from-layer="2941" from-port="0" to-layer="2942" to-port="3" /> + <edge from-layer="2942" from-port="4" to-layer="2949" to-port="0" /> + <edge from-layer="2943" from-port="0" to-layer="2949" to-port="1" /> + <edge from-layer="2944" from-port="0" to-layer="2947" to-port="0" /> + <edge from-layer="2945" from-port="0" to-layer="2947" to-port="1" /> + <edge from-layer="2946" from-port="0" to-layer="2947" to-port="3" /> + <edge from-layer="2947" from-port="4" to-layer="2949" to-port="2" /> + <edge from-layer="2948" from-port="0" to-layer="2949" to-port="3" /> + <edge from-layer="2949" from-port="4" to-layer="2952" to-port="0" /> + <edge from-layer="2950" from-port="0" to-layer="2952" to-port="1" /> + <edge from-layer="2951" from-port="0" to-layer="2952" to-port="2" /> + <edge from-layer="2952" from-port="3" to-layer="2953" to-port="0" /> + <edge from-layer="2953" from-port="2" to-layer="2954" to-port="0" /> + <edge from-layer="2953" from-port="2" to-layer="2963" to-port="0" /> + <edge from-layer="2954" from-port="1" to-layer="2962" to-port="0" /> + <edge from-layer="2955" from-port="0" to-layer="2957" to-port="1" /> + <edge from-layer="2956" from-port="0" to-layer="2957" to-port="2" /> + <edge from-layer="2957" from-port="3" to-layer="2961" to-port="0" /> + <edge from-layer="2958" from-port="0" to-layer="2961" to-port="1" /> + <edge from-layer="2959" from-port="0" to-layer="2961" to-port="2" /> + <edge from-layer="2960" from-port="0" to-layer="2961" to-port="3" /> + <edge from-layer="2961" from-port="4" to-layer="2962" to-port="1" /> + <edge from-layer="2962" from-port="2" to-layer="2963" to-port="1" /> + <edge from-layer="2963" from-port="2" to-layer="2964" to-port="3" /> + <edge from-layer="2964" from-port="4" to-layer="2966" to-port="0" /> + <edge from-layer="2965" from-port="0" to-layer="2966" to-port="1" /> + <edge from-layer="2966" from-port="2" to-layer="2968" to-port="0" /> + <edge from-layer="2967" from-port="0" to-layer="2968" to-port="1" /> + <edge from-layer="2968" from-port="2" to-layer="2977" to-port="0" /> + <edge from-layer="2969" from-port="0" to-layer="2970" to-port="0" /> + <edge from-layer="2970" from-port="1" to-layer="2973" to-port="0" /> + <edge from-layer="2971" from-port="0" to-layer="2972" to-port="0" /> + <edge from-layer="2972" from-port="1" to-layer="2973" to-port="1" /> + <edge from-layer="2973" from-port="2" to-layer="2975" to-port="0" /> + <edge from-layer="2974" from-port="0" to-layer="2975" to-port="1" /> + <edge from-layer="2975" from-port="2" to-layer="2976" to-port="0" /> + <edge from-layer="2976" from-port="1" to-layer="2977" to-port="1" /> + <edge from-layer="2977" from-port="2" to-layer="2979" to-port="0" /> + <edge from-layer="2978" from-port="0" to-layer="2979" to-port="1" /> + <edge from-layer="2979" from-port="2" to-layer="2980" to-port="0" /> + <edge from-layer="2980" from-port="2" to-layer="2982" to-port="0" /> + <edge from-layer="2980" from-port="2" to-layer="3010" to-port="1" /> + <edge from-layer="2981" from-port="0" to-layer="2982" to-port="1" /> + <edge from-layer="2982" from-port="2" to-layer="2984" to-port="0" /> + <edge from-layer="2983" from-port="0" to-layer="2984" to-port="1" /> + <edge from-layer="2984" from-port="2" to-layer="2986" to-port="0" /> + <edge from-layer="2985" from-port="0" to-layer="2986" to-port="1" /> + <edge from-layer="2986" from-port="2" to-layer="2995" to-port="0" /> + <edge from-layer="2987" from-port="0" to-layer="2988" to-port="0" /> + <edge from-layer="2988" from-port="1" to-layer="2991" to-port="0" /> + <edge from-layer="2989" from-port="0" to-layer="2990" to-port="0" /> + <edge from-layer="2990" from-port="1" to-layer="2991" to-port="1" /> + <edge from-layer="2991" from-port="2" to-layer="2993" to-port="0" /> + <edge from-layer="2992" from-port="0" to-layer="2993" to-port="1" /> + <edge from-layer="2993" from-port="2" to-layer="2994" to-port="0" /> + <edge from-layer="2994" from-port="1" to-layer="2995" to-port="1" /> + <edge from-layer="2995" from-port="2" to-layer="2997" to-port="0" /> + <edge from-layer="2996" from-port="0" to-layer="2997" to-port="1" /> + <edge from-layer="2997" from-port="2" to-layer="2998" to-port="0" /> + <edge from-layer="2998" from-port="1" to-layer="3007" to-port="0" /> + <edge from-layer="2999" from-port="0" to-layer="3000" to-port="0" /> + <edge from-layer="3000" from-port="1" to-layer="3003" to-port="0" /> + <edge from-layer="3001" from-port="0" to-layer="3002" to-port="0" /> + <edge from-layer="3002" from-port="1" to-layer="3003" to-port="1" /> + <edge from-layer="3003" from-port="2" to-layer="3005" to-port="0" /> + <edge from-layer="3004" from-port="0" to-layer="3005" to-port="1" /> + <edge from-layer="3005" from-port="2" to-layer="3006" to-port="0" /> + <edge from-layer="3006" from-port="1" to-layer="3007" to-port="1" /> + <edge from-layer="3007" from-port="2" to-layer="3009" to-port="0" /> + <edge from-layer="3008" from-port="0" to-layer="3009" to-port="1" /> + <edge from-layer="3009" from-port="2" to-layer="3010" to-port="0" /> + <edge from-layer="3010" from-port="2" to-layer="3207" to-port="1" /> + <edge from-layer="3010" from-port="2" to-layer="3012" to-port="0" /> + <edge from-layer="3011" from-port="0" to-layer="3012" to-port="1" /> + <edge from-layer="3012" from-port="2" to-layer="3014" to-port="0" /> + <edge from-layer="3013" from-port="0" to-layer="3014" to-port="1" /> + <edge from-layer="3014" from-port="2" to-layer="3016" to-port="0" /> + <edge from-layer="3015" from-port="0" to-layer="3016" to-port="1" /> + <edge from-layer="3016" from-port="2" to-layer="3025" to-port="0" /> + <edge from-layer="3017" from-port="0" to-layer="3018" to-port="0" /> + <edge from-layer="3018" from-port="1" to-layer="3021" to-port="0" /> + <edge from-layer="3019" from-port="0" to-layer="3020" to-port="0" /> + <edge from-layer="3020" from-port="1" to-layer="3021" to-port="1" /> + <edge from-layer="3021" from-port="2" to-layer="3023" to-port="0" /> + <edge from-layer="3022" from-port="0" to-layer="3023" to-port="1" /> + <edge from-layer="3023" from-port="2" to-layer="3024" to-port="0" /> + <edge from-layer="3024" from-port="1" to-layer="3025" to-port="1" /> + <edge from-layer="3025" from-port="2" to-layer="3027" to-port="0" /> + <edge from-layer="3026" from-port="0" to-layer="3027" to-port="1" /> + <edge from-layer="3027" from-port="2" to-layer="3029" to-port="0" /> + <edge from-layer="3028" from-port="0" to-layer="3029" to-port="1" /> + <edge from-layer="3029" from-port="2" to-layer="3033" to-port="0" /> + <edge from-layer="3029" from-port="2" to-layer="3143" to-port="0" /> + <edge from-layer="3029" from-port="2" to-layer="3045" to-port="0" /> + <edge from-layer="3030" from-port="0" to-layer="3033" to-port="1" /> + <edge from-layer="3031" from-port="0" to-layer="3033" to-port="2" /> + <edge from-layer="3032" from-port="0" to-layer="3033" to-port="3" /> + <edge from-layer="3033" from-port="4" to-layer="3035" to-port="0" /> + <edge from-layer="3034" from-port="0" to-layer="3035" to-port="1" /> + <edge from-layer="3035" from-port="2" to-layer="3039" to-port="0" /> + <edge from-layer="3036" from-port="0" to-layer="3039" to-port="1" /> + <edge from-layer="3037" from-port="0" to-layer="3039" to-port="2" /> + <edge from-layer="3038" from-port="0" to-layer="3039" to-port="3" /> + <edge from-layer="3039" from-port="4" to-layer="3090" to-port="0" /> + <edge from-layer="3039" from-port="4" to-layer="3071" to-port="0" /> + <edge from-layer="3039" from-port="4" to-layer="3074" to-port="0" /> + <edge from-layer="3039" from-port="4" to-layer="3085" to-port="0" /> + <edge from-layer="3040" from-port="0" to-layer="3067" to-port="0" /> + <edge from-layer="3041" from-port="0" to-layer="3067" to-port="1" /> + <edge from-layer="3042" from-port="0" to-layer="3045" to-port="1" /> + <edge from-layer="3043" from-port="0" to-layer="3045" to-port="2" /> + <edge from-layer="3044" from-port="0" to-layer="3045" to-port="3" /> + <edge from-layer="3045" from-port="4" to-layer="3046" to-port="0" /> + <edge from-layer="3045" from-port="4" to-layer="3102" to-port="0" /> + <edge from-layer="3046" from-port="1" to-layer="3049" to-port="0" /> + <edge from-layer="3047" from-port="0" to-layer="3049" to-port="1" /> + <edge from-layer="3048" from-port="0" to-layer="3049" to-port="2" /> + <edge from-layer="3049" from-port="3" to-layer="3065" to-port="0" /> + <edge from-layer="3050" from-port="0" to-layer="3055" to-port="0" /> + <edge from-layer="3051" from-port="0" to-layer="3054" to-port="1" /> + <edge from-layer="3052" from-port="0" to-layer="3054" to-port="2" /> + <edge from-layer="3053" from-port="0" to-layer="3054" to-port="3" /> + <edge from-layer="3054" from-port="4" to-layer="3055" to-port="1" /> + <edge from-layer="3055" from-port="2" to-layer="3056" to-port="0" /> + <edge from-layer="3056" from-port="1" to-layer="3058" to-port="0" /> + <edge from-layer="3057" from-port="0" to-layer="3058" to-port="2" /> + <edge from-layer="3058" from-port="3" to-layer="3059" to-port="0" /> + <edge from-layer="3058" from-port="3" to-layer="3130" to-port="0" /> + <edge from-layer="3059" from-port="1" to-layer="3062" to-port="0" /> + <edge from-layer="3060" from-port="0" to-layer="3062" to-port="1" /> + <edge from-layer="3061" from-port="0" to-layer="3062" to-port="2" /> + <edge from-layer="3062" from-port="3" to-layer="3064" to-port="0" /> + <edge from-layer="3062" from-port="3" to-layer="3154" to-port="0" /> + <edge from-layer="3063" from-port="0" to-layer="3064" to-port="1" /> + <edge from-layer="3064" from-port="2" to-layer="3065" to-port="1" /> + <edge from-layer="3065" from-port="2" to-layer="3067" to-port="2" /> + <edge from-layer="3065" from-port="2" to-layer="3095" to-port="2" /> + <edge from-layer="3066" from-port="0" to-layer="3067" to-port="3" /> + <edge from-layer="3067" from-port="4" to-layer="3069" to-port="0" /> + <edge from-layer="3068" from-port="0" to-layer="3069" to-port="2" /> + <edge from-layer="3069" from-port="3" to-layer="3070" to-port="0" /> + <edge from-layer="3070" from-port="2" to-layer="3107" to-port="1" /> + <edge from-layer="3070" from-port="2" to-layer="3071" to-port="1" /> + <edge from-layer="3071" from-port="2" to-layer="3100" to-port="0" /> + <edge from-layer="3072" from-port="0" to-layer="3082" to-port="0" /> + <edge from-layer="3073" from-port="0" to-layer="3082" to-port="1" /> + <edge from-layer="3074" from-port="1" to-layer="3076" to-port="0" /> + <edge from-layer="3075" from-port="0" to-layer="3076" to-port="2" /> + <edge from-layer="3076" from-port="3" to-layer="3077" to-port="0" /> + <edge from-layer="3077" from-port="2" to-layer="3078" to-port="0" /> + <edge from-layer="3078" from-port="1" to-layer="3080" to-port="0" /> + <edge from-layer="3079" from-port="0" to-layer="3080" to-port="1" /> + <edge from-layer="3080" from-port="2" to-layer="3082" to-port="2" /> + <edge from-layer="3081" from-port="0" to-layer="3082" to-port="3" /> + <edge from-layer="3082" from-port="4" to-layer="3090" to-port="2" /> + <edge from-layer="3082" from-port="4" to-layer="3085" to-port="1" /> + <edge from-layer="3083" from-port="0" to-layer="3085" to-port="2" /> + <edge from-layer="3084" from-port="0" to-layer="3085" to-port="3" /> + <edge from-layer="3085" from-port="4" to-layer="3087" to-port="0" /> + <edge from-layer="3086" from-port="0" to-layer="3087" to-port="1" /> + <edge from-layer="3087" from-port="2" to-layer="3091" to-port="0" /> + <edge from-layer="3088" from-port="0" to-layer="3090" to-port="1" /> + <edge from-layer="3089" from-port="0" to-layer="3090" to-port="3" /> + <edge from-layer="3090" from-port="4" to-layer="3091" to-port="1" /> + <edge from-layer="3091" from-port="2" to-layer="3099" to-port="0" /> + <edge from-layer="3092" from-port="0" to-layer="3095" to-port="0" /> + <edge from-layer="3093" from-port="0" to-layer="3095" to-port="1" /> + <edge from-layer="3094" from-port="0" to-layer="3095" to-port="3" /> + <edge from-layer="3095" from-port="4" to-layer="3097" to-port="0" /> + <edge from-layer="3096" from-port="0" to-layer="3097" to-port="2" /> + <edge from-layer="3097" from-port="3" to-layer="3098" to-port="0" /> + <edge from-layer="3098" from-port="2" to-layer="3128" to-port="1" /> + <edge from-layer="3098" from-port="2" to-layer="3099" to-port="1" /> + <edge from-layer="3099" from-port="2" to-layer="3100" to-port="1" /> + <edge from-layer="3100" from-port="2" to-layer="3155" to-port="0" /> + <edge from-layer="3100" from-port="2" to-layer="3191" to-port="0" /> + <edge from-layer="3101" from-port="0" to-layer="3102" to-port="1" /> + <edge from-layer="3102" from-port="2" to-layer="3106" to-port="0" /> + <edge from-layer="3103" from-port="0" to-layer="3106" to-port="1" /> + <edge from-layer="3104" from-port="0" to-layer="3106" to-port="2" /> + <edge from-layer="3105" from-port="0" to-layer="3106" to-port="3" /> + <edge from-layer="3106" from-port="4" to-layer="3121" to-port="0" /> + <edge from-layer="3106" from-port="4" to-layer="3107" to-port="0" /> + <edge from-layer="3106" from-port="4" to-layer="3126" to-port="0" /> + <edge from-layer="3106" from-port="4" to-layer="3110" to-port="0" /> + <edge from-layer="3107" from-port="2" to-layer="3129" to-port="0" /> + <edge from-layer="3108" from-port="0" to-layer="3118" to-port="0" /> + <edge from-layer="3109" from-port="0" to-layer="3118" to-port="1" /> + <edge from-layer="3110" from-port="1" to-layer="3112" to-port="0" /> + <edge from-layer="3111" from-port="0" to-layer="3112" to-port="2" /> + <edge from-layer="3112" from-port="3" to-layer="3113" to-port="0" /> + <edge from-layer="3113" from-port="2" to-layer="3114" to-port="0" /> + <edge from-layer="3114" from-port="1" to-layer="3116" to-port="0" /> + <edge from-layer="3115" from-port="0" to-layer="3116" to-port="1" /> + <edge from-layer="3116" from-port="2" to-layer="3118" to-port="2" /> + <edge from-layer="3117" from-port="0" to-layer="3118" to-port="3" /> + <edge from-layer="3118" from-port="4" to-layer="3126" to-port="2" /> + <edge from-layer="3118" from-port="4" to-layer="3121" to-port="1" /> + <edge from-layer="3119" from-port="0" to-layer="3121" to-port="2" /> + <edge from-layer="3120" from-port="0" to-layer="3121" to-port="3" /> + <edge from-layer="3121" from-port="4" to-layer="3123" to-port="0" /> + <edge from-layer="3122" from-port="0" to-layer="3123" to-port="1" /> + <edge from-layer="3123" from-port="2" to-layer="3127" to-port="0" /> + <edge from-layer="3124" from-port="0" to-layer="3126" to-port="1" /> + <edge from-layer="3125" from-port="0" to-layer="3126" to-port="3" /> + <edge from-layer="3126" from-port="4" to-layer="3127" to-port="1" /> + <edge from-layer="3127" from-port="2" to-layer="3128" to-port="0" /> + <edge from-layer="3128" from-port="2" to-layer="3129" to-port="1" /> + <edge from-layer="3129" from-port="2" to-layer="3130" to-port="1" /> + <edge from-layer="3129" from-port="2" to-layer="3150" to-port="0" /> + <edge from-layer="3130" from-port="2" to-layer="7230" to-port="0" /> + <edge from-layer="3130" from-port="2" to-layer="3191" to-port="1" /> + <edge from-layer="3131" from-port="0" to-layer="3136" to-port="0" /> + <edge from-layer="3132" from-port="0" to-layer="3135" to-port="1" /> + <edge from-layer="3133" from-port="0" to-layer="3135" to-port="2" /> + <edge from-layer="3134" from-port="0" to-layer="3135" to-port="3" /> + <edge from-layer="3135" from-port="4" to-layer="3136" to-port="1" /> + <edge from-layer="3136" from-port="2" to-layer="3137" to-port="0" /> + <edge from-layer="3137" from-port="1" to-layer="3139" to-port="0" /> + <edge from-layer="3138" from-port="0" to-layer="3139" to-port="2" /> + <edge from-layer="3139" from-port="3" to-layer="3146" to-port="0" /> + <edge from-layer="3140" from-port="0" to-layer="3143" to-port="1" /> + <edge from-layer="3141" from-port="0" to-layer="3143" to-port="2" /> + <edge from-layer="3142" from-port="0" to-layer="3143" to-port="3" /> + <edge from-layer="3143" from-port="4" to-layer="3145" to-port="0" /> + <edge from-layer="3144" from-port="0" to-layer="3145" to-port="1" /> + <edge from-layer="3145" from-port="2" to-layer="3146" to-port="1" /> + <edge from-layer="3146" from-port="2" to-layer="7229" to-port="0" /> + <edge from-layer="3146" from-port="2" to-layer="3191" to-port="2" /> + <edge from-layer="3147" from-port="0" to-layer="3169" to-port="0" /> + <edge from-layer="3148" from-port="0" to-layer="3163" to-port="0" /> + <edge from-layer="3149" from-port="0" to-layer="3167" to-port="1" /> + <edge from-layer="3149" from-port="0" to-layer="3163" to-port="1" /> + <edge from-layer="3150" from-port="1" to-layer="3153" to-port="0" /> + <edge from-layer="3151" from-port="0" to-layer="3153" to-port="1" /> + <edge from-layer="3152" from-port="0" to-layer="3153" to-port="2" /> + <edge from-layer="3153" from-port="3" to-layer="3154" to-port="1" /> + <edge from-layer="3154" from-port="2" to-layer="3159" to-port="0" /> + <edge from-layer="3154" from-port="2" to-layer="3166" to-port="0" /> + <edge from-layer="3155" from-port="1" to-layer="3184" to-port="0" /> + <edge from-layer="3155" from-port="1" to-layer="3158" to-port="0" /> + <edge from-layer="3156" from-port="0" to-layer="3158" to-port="1" /> + <edge from-layer="3157" from-port="0" to-layer="3158" to-port="2" /> + <edge from-layer="3158" from-port="3" to-layer="3159" to-port="1" /> + <edge from-layer="3159" from-port="2" to-layer="3161" to-port="0" /> + <edge from-layer="3160" from-port="0" to-layer="3161" to-port="1" /> + <edge from-layer="3161" from-port="2" to-layer="3163" to-port="2" /> + <edge from-layer="3162" from-port="0" to-layer="3163" to-port="3" /> + <edge from-layer="3162" from-port="0" to-layer="3167" to-port="3" /> + <edge from-layer="3163" from-port="4" to-layer="3169" to-port="1" /> + <edge from-layer="3164" from-port="0" to-layer="3167" to-port="0" /> + <edge from-layer="3165" from-port="0" to-layer="3166" to-port="1" /> + <edge from-layer="3166" from-port="2" to-layer="3167" to-port="2" /> + <edge from-layer="3166" from-port="2" to-layer="3174" to-port="2" /> + <edge from-layer="3167" from-port="4" to-layer="3169" to-port="2" /> + <edge from-layer="3168" from-port="0" to-layer="3169" to-port="3" /> + <edge from-layer="3169" from-port="4" to-layer="3176" to-port="0" /> + <edge from-layer="3170" from-port="0" to-layer="3176" to-port="1" /> + <edge from-layer="3171" from-port="0" to-layer="3174" to-port="0" /> + <edge from-layer="3172" from-port="0" to-layer="3174" to-port="1" /> + <edge from-layer="3173" from-port="0" to-layer="3174" to-port="3" /> + <edge from-layer="3174" from-port="4" to-layer="3176" to-port="2" /> + <edge from-layer="3175" from-port="0" to-layer="3176" to-port="3" /> + <edge from-layer="3176" from-port="4" to-layer="3179" to-port="0" /> + <edge from-layer="3177" from-port="0" to-layer="3179" to-port="1" /> + <edge from-layer="3178" from-port="0" to-layer="3179" to-port="2" /> + <edge from-layer="3179" from-port="3" to-layer="3180" to-port="0" /> + <edge from-layer="3180" from-port="2" to-layer="3181" to-port="0" /> + <edge from-layer="3180" from-port="2" to-layer="3190" to-port="0" /> + <edge from-layer="3181" from-port="1" to-layer="3189" to-port="0" /> + <edge from-layer="3182" from-port="0" to-layer="3184" to-port="1" /> + <edge from-layer="3183" from-port="0" to-layer="3184" to-port="2" /> + <edge from-layer="3184" from-port="3" to-layer="3188" to-port="0" /> + <edge from-layer="3185" from-port="0" to-layer="3188" to-port="1" /> + <edge from-layer="3186" from-port="0" to-layer="3188" to-port="2" /> + <edge from-layer="3187" from-port="0" to-layer="3188" to-port="3" /> + <edge from-layer="3188" from-port="4" to-layer="3189" to-port="1" /> + <edge from-layer="3189" from-port="2" to-layer="3190" to-port="1" /> + <edge from-layer="3190" from-port="2" to-layer="3191" to-port="3" /> + <edge from-layer="3191" from-port="4" to-layer="3193" to-port="0" /> + <edge from-layer="3192" from-port="0" to-layer="3193" to-port="1" /> + <edge from-layer="3193" from-port="2" to-layer="3195" to-port="0" /> + <edge from-layer="3194" from-port="0" to-layer="3195" to-port="1" /> + <edge from-layer="3195" from-port="2" to-layer="3204" to-port="0" /> + <edge from-layer="3196" from-port="0" to-layer="3197" to-port="0" /> + <edge from-layer="3197" from-port="1" to-layer="3200" to-port="0" /> + <edge from-layer="3198" from-port="0" to-layer="3199" to-port="0" /> + <edge from-layer="3199" from-port="1" to-layer="3200" to-port="1" /> + <edge from-layer="3200" from-port="2" to-layer="3202" to-port="0" /> + <edge from-layer="3201" from-port="0" to-layer="3202" to-port="1" /> + <edge from-layer="3202" from-port="2" to-layer="3203" to-port="0" /> + <edge from-layer="3203" from-port="1" to-layer="3204" to-port="1" /> + <edge from-layer="3204" from-port="2" to-layer="3206" to-port="0" /> + <edge from-layer="3205" from-port="0" to-layer="3206" to-port="1" /> + <edge from-layer="3206" from-port="2" to-layer="3207" to-port="0" /> + <edge from-layer="3207" from-port="2" to-layer="3209" to-port="0" /> + <edge from-layer="3207" from-port="2" to-layer="3237" to-port="1" /> + <edge from-layer="3208" from-port="0" to-layer="3209" to-port="1" /> + <edge from-layer="3209" from-port="2" to-layer="3211" to-port="0" /> + <edge from-layer="3210" from-port="0" to-layer="3211" to-port="1" /> + <edge from-layer="3211" from-port="2" to-layer="3213" to-port="0" /> + <edge from-layer="3212" from-port="0" to-layer="3213" to-port="1" /> + <edge from-layer="3213" from-port="2" to-layer="3222" to-port="0" /> + <edge from-layer="3214" from-port="0" to-layer="3215" to-port="0" /> + <edge from-layer="3215" from-port="1" to-layer="3218" to-port="0" /> + <edge from-layer="3216" from-port="0" to-layer="3217" to-port="0" /> + <edge from-layer="3217" from-port="1" to-layer="3218" to-port="1" /> + <edge from-layer="3218" from-port="2" to-layer="3220" to-port="0" /> + <edge from-layer="3219" from-port="0" to-layer="3220" to-port="1" /> + <edge from-layer="3220" from-port="2" to-layer="3221" to-port="0" /> + <edge from-layer="3221" from-port="1" to-layer="3222" to-port="1" /> + <edge from-layer="3222" from-port="2" to-layer="3224" to-port="0" /> + <edge from-layer="3223" from-port="0" to-layer="3224" to-port="1" /> + <edge from-layer="3224" from-port="2" to-layer="3225" to-port="0" /> + <edge from-layer="3225" from-port="1" to-layer="3234" to-port="0" /> + <edge from-layer="3226" from-port="0" to-layer="3227" to-port="0" /> + <edge from-layer="3227" from-port="1" to-layer="3230" to-port="0" /> + <edge from-layer="3228" from-port="0" to-layer="3229" to-port="0" /> + <edge from-layer="3229" from-port="1" to-layer="3230" to-port="1" /> + <edge from-layer="3230" from-port="2" to-layer="3232" to-port="0" /> + <edge from-layer="3231" from-port="0" to-layer="3232" to-port="1" /> + <edge from-layer="3232" from-port="2" to-layer="3233" to-port="0" /> + <edge from-layer="3233" from-port="1" to-layer="3234" to-port="1" /> + <edge from-layer="3234" from-port="2" to-layer="3236" to-port="0" /> + <edge from-layer="3235" from-port="0" to-layer="3236" to-port="1" /> + <edge from-layer="3236" from-port="2" to-layer="3237" to-port="0" /> + <edge from-layer="3237" from-port="2" to-layer="3239" to-port="0" /> + <edge from-layer="3237" from-port="2" to-layer="3434" to-port="1" /> + <edge from-layer="3238" from-port="0" to-layer="3239" to-port="1" /> + <edge from-layer="3239" from-port="2" to-layer="3241" to-port="0" /> + <edge from-layer="3240" from-port="0" to-layer="3241" to-port="1" /> + <edge from-layer="3241" from-port="2" to-layer="3243" to-port="0" /> + <edge from-layer="3242" from-port="0" to-layer="3243" to-port="1" /> + <edge from-layer="3243" from-port="2" to-layer="3252" to-port="0" /> + <edge from-layer="3244" from-port="0" to-layer="3245" to-port="0" /> + <edge from-layer="3245" from-port="1" to-layer="3248" to-port="0" /> + <edge from-layer="3246" from-port="0" to-layer="3247" to-port="0" /> + <edge from-layer="3247" from-port="1" to-layer="3248" to-port="1" /> + <edge from-layer="3248" from-port="2" to-layer="3250" to-port="0" /> + <edge from-layer="3249" from-port="0" to-layer="3250" to-port="1" /> + <edge from-layer="3250" from-port="2" to-layer="3251" to-port="0" /> + <edge from-layer="3251" from-port="1" to-layer="3252" to-port="1" /> + <edge from-layer="3252" from-port="2" to-layer="3254" to-port="0" /> + <edge from-layer="3253" from-port="0" to-layer="3254" to-port="1" /> + <edge from-layer="3254" from-port="2" to-layer="3256" to-port="0" /> + <edge from-layer="3255" from-port="0" to-layer="3256" to-port="1" /> + <edge from-layer="3256" from-port="2" to-layer="3272" to-port="0" /> + <edge from-layer="3256" from-port="2" to-layer="3370" to-port="0" /> + <edge from-layer="3256" from-port="2" to-layer="3260" to-port="0" /> + <edge from-layer="3257" from-port="0" to-layer="3260" to-port="1" /> + <edge from-layer="3258" from-port="0" to-layer="3260" to-port="2" /> + <edge from-layer="3259" from-port="0" to-layer="3260" to-port="3" /> + <edge from-layer="3260" from-port="4" to-layer="3262" to-port="0" /> + <edge from-layer="3261" from-port="0" to-layer="3262" to-port="1" /> + <edge from-layer="3262" from-port="2" to-layer="3266" to-port="0" /> + <edge from-layer="3263" from-port="0" to-layer="3266" to-port="1" /> + <edge from-layer="3264" from-port="0" to-layer="3266" to-port="2" /> + <edge from-layer="3265" from-port="0" to-layer="3266" to-port="3" /> + <edge from-layer="3266" from-port="4" to-layer="3317" to-port="0" /> + <edge from-layer="3266" from-port="4" to-layer="3301" to-port="0" /> + <edge from-layer="3266" from-port="4" to-layer="3298" to-port="0" /> + <edge from-layer="3266" from-port="4" to-layer="3312" to-port="0" /> + <edge from-layer="3267" from-port="0" to-layer="3294" to-port="0" /> + <edge from-layer="3268" from-port="0" to-layer="3294" to-port="1" /> + <edge from-layer="3269" from-port="0" to-layer="3272" to-port="1" /> + <edge from-layer="3270" from-port="0" to-layer="3272" to-port="2" /> + <edge from-layer="3271" from-port="0" to-layer="3272" to-port="3" /> + <edge from-layer="3272" from-port="4" to-layer="3329" to-port="0" /> + <edge from-layer="3272" from-port="4" to-layer="3273" to-port="0" /> + <edge from-layer="3273" from-port="1" to-layer="3276" to-port="0" /> + <edge from-layer="3274" from-port="0" to-layer="3276" to-port="1" /> + <edge from-layer="3275" from-port="0" to-layer="3276" to-port="2" /> + <edge from-layer="3276" from-port="3" to-layer="3292" to-port="0" /> + <edge from-layer="3277" from-port="0" to-layer="3282" to-port="0" /> + <edge from-layer="3278" from-port="0" to-layer="3281" to-port="1" /> + <edge from-layer="3279" from-port="0" to-layer="3281" to-port="2" /> + <edge from-layer="3280" from-port="0" to-layer="3281" to-port="3" /> + <edge from-layer="3281" from-port="4" to-layer="3282" to-port="1" /> + <edge from-layer="3282" from-port="2" to-layer="3283" to-port="0" /> + <edge from-layer="3283" from-port="1" to-layer="3285" to-port="0" /> + <edge from-layer="3284" from-port="0" to-layer="3285" to-port="2" /> + <edge from-layer="3285" from-port="3" to-layer="3286" to-port="0" /> + <edge from-layer="3285" from-port="3" to-layer="3357" to-port="0" /> + <edge from-layer="3286" from-port="1" to-layer="3289" to-port="0" /> + <edge from-layer="3287" from-port="0" to-layer="3289" to-port="1" /> + <edge from-layer="3288" from-port="0" to-layer="3289" to-port="2" /> + <edge from-layer="3289" from-port="3" to-layer="3291" to-port="0" /> + <edge from-layer="3289" from-port="3" to-layer="3381" to-port="0" /> + <edge from-layer="3290" from-port="0" to-layer="3291" to-port="1" /> + <edge from-layer="3291" from-port="2" to-layer="3292" to-port="1" /> + <edge from-layer="3292" from-port="2" to-layer="3294" to-port="2" /> + <edge from-layer="3292" from-port="2" to-layer="3322" to-port="2" /> + <edge from-layer="3293" from-port="0" to-layer="3294" to-port="3" /> + <edge from-layer="3294" from-port="4" to-layer="3296" to-port="0" /> + <edge from-layer="3295" from-port="0" to-layer="3296" to-port="2" /> + <edge from-layer="3296" from-port="3" to-layer="3297" to-port="0" /> + <edge from-layer="3297" from-port="2" to-layer="3334" to-port="1" /> + <edge from-layer="3297" from-port="2" to-layer="3298" to-port="1" /> + <edge from-layer="3298" from-port="2" to-layer="3327" to-port="0" /> + <edge from-layer="3299" from-port="0" to-layer="3309" to-port="0" /> + <edge from-layer="3300" from-port="0" to-layer="3309" to-port="1" /> + <edge from-layer="3301" from-port="1" to-layer="3303" to-port="0" /> + <edge from-layer="3302" from-port="0" to-layer="3303" to-port="2" /> + <edge from-layer="3303" from-port="3" to-layer="3304" to-port="0" /> + <edge from-layer="3304" from-port="2" to-layer="3305" to-port="0" /> + <edge from-layer="3305" from-port="1" to-layer="3307" to-port="0" /> + <edge from-layer="3306" from-port="0" to-layer="3307" to-port="1" /> + <edge from-layer="3307" from-port="2" to-layer="3309" to-port="2" /> + <edge from-layer="3308" from-port="0" to-layer="3309" to-port="3" /> + <edge from-layer="3309" from-port="4" to-layer="3317" to-port="2" /> + <edge from-layer="3309" from-port="4" to-layer="3312" to-port="1" /> + <edge from-layer="3310" from-port="0" to-layer="3312" to-port="2" /> + <edge from-layer="3311" from-port="0" to-layer="3312" to-port="3" /> + <edge from-layer="3312" from-port="4" to-layer="3314" to-port="0" /> + <edge from-layer="3313" from-port="0" to-layer="3314" to-port="1" /> + <edge from-layer="3314" from-port="2" to-layer="3318" to-port="0" /> + <edge from-layer="3315" from-port="0" to-layer="3317" to-port="1" /> + <edge from-layer="3316" from-port="0" to-layer="3317" to-port="3" /> + <edge from-layer="3317" from-port="4" to-layer="3318" to-port="1" /> + <edge from-layer="3318" from-port="2" to-layer="3326" to-port="0" /> + <edge from-layer="3319" from-port="0" to-layer="3322" to-port="0" /> + <edge from-layer="3320" from-port="0" to-layer="3322" to-port="1" /> + <edge from-layer="3321" from-port="0" to-layer="3322" to-port="3" /> + <edge from-layer="3322" from-port="4" to-layer="3324" to-port="0" /> + <edge from-layer="3323" from-port="0" to-layer="3324" to-port="2" /> + <edge from-layer="3324" from-port="3" to-layer="3325" to-port="0" /> + <edge from-layer="3325" from-port="2" to-layer="3326" to-port="1" /> + <edge from-layer="3325" from-port="2" to-layer="3355" to-port="1" /> + <edge from-layer="3326" from-port="2" to-layer="3327" to-port="1" /> + <edge from-layer="3327" from-port="2" to-layer="3382" to-port="0" /> + <edge from-layer="3327" from-port="2" to-layer="3418" to-port="0" /> + <edge from-layer="3328" from-port="0" to-layer="3329" to-port="1" /> + <edge from-layer="3329" from-port="2" to-layer="3333" to-port="0" /> + <edge from-layer="3330" from-port="0" to-layer="3333" to-port="1" /> + <edge from-layer="3331" from-port="0" to-layer="3333" to-port="2" /> + <edge from-layer="3332" from-port="0" to-layer="3333" to-port="3" /> + <edge from-layer="3333" from-port="4" to-layer="3334" to-port="0" /> + <edge from-layer="3333" from-port="4" to-layer="3337" to-port="0" /> + <edge from-layer="3333" from-port="4" to-layer="3348" to-port="0" /> + <edge from-layer="3333" from-port="4" to-layer="3353" to-port="0" /> + <edge from-layer="3334" from-port="2" to-layer="3356" to-port="0" /> + <edge from-layer="3335" from-port="0" to-layer="3345" to-port="0" /> + <edge from-layer="3336" from-port="0" to-layer="3345" to-port="1" /> + <edge from-layer="3337" from-port="1" to-layer="3339" to-port="0" /> + <edge from-layer="3338" from-port="0" to-layer="3339" to-port="2" /> + <edge from-layer="3339" from-port="3" to-layer="3340" to-port="0" /> + <edge from-layer="3340" from-port="2" to-layer="3341" to-port="0" /> + <edge from-layer="3341" from-port="1" to-layer="3343" to-port="0" /> + <edge from-layer="3342" from-port="0" to-layer="3343" to-port="1" /> + <edge from-layer="3343" from-port="2" to-layer="3345" to-port="2" /> + <edge from-layer="3344" from-port="0" to-layer="3345" to-port="3" /> + <edge from-layer="3345" from-port="4" to-layer="3348" to-port="1" /> + <edge from-layer="3345" from-port="4" to-layer="3353" to-port="2" /> + <edge from-layer="3346" from-port="0" to-layer="3348" to-port="2" /> + <edge from-layer="3347" from-port="0" to-layer="3348" to-port="3" /> + <edge from-layer="3348" from-port="4" to-layer="3350" to-port="0" /> + <edge from-layer="3349" from-port="0" to-layer="3350" to-port="1" /> + <edge from-layer="3350" from-port="2" to-layer="3354" to-port="0" /> + <edge from-layer="3351" from-port="0" to-layer="3353" to-port="1" /> + <edge from-layer="3352" from-port="0" to-layer="3353" to-port="3" /> + <edge from-layer="3353" from-port="4" to-layer="3354" to-port="1" /> + <edge from-layer="3354" from-port="2" to-layer="3355" to-port="0" /> + <edge from-layer="3355" from-port="2" to-layer="3356" to-port="1" /> + <edge from-layer="3356" from-port="2" to-layer="3377" to-port="0" /> + <edge from-layer="3356" from-port="2" to-layer="3357" to-port="1" /> + <edge from-layer="3357" from-port="2" to-layer="7228" to-port="0" /> + <edge from-layer="3357" from-port="2" to-layer="3418" to-port="1" /> + <edge from-layer="3358" from-port="0" to-layer="3363" to-port="0" /> + <edge from-layer="3359" from-port="0" to-layer="3362" to-port="1" /> + <edge from-layer="3360" from-port="0" to-layer="3362" to-port="2" /> + <edge from-layer="3361" from-port="0" to-layer="3362" to-port="3" /> + <edge from-layer="3362" from-port="4" to-layer="3363" to-port="1" /> + <edge from-layer="3363" from-port="2" to-layer="3364" to-port="0" /> + <edge from-layer="3364" from-port="1" to-layer="3366" to-port="0" /> + <edge from-layer="3365" from-port="0" to-layer="3366" to-port="2" /> + <edge from-layer="3366" from-port="3" to-layer="3373" to-port="0" /> + <edge from-layer="3367" from-port="0" to-layer="3370" to-port="1" /> + <edge from-layer="3368" from-port="0" to-layer="3370" to-port="2" /> + <edge from-layer="3369" from-port="0" to-layer="3370" to-port="3" /> + <edge from-layer="3370" from-port="4" to-layer="3372" to-port="0" /> + <edge from-layer="3371" from-port="0" to-layer="3372" to-port="1" /> + <edge from-layer="3372" from-port="2" to-layer="3373" to-port="1" /> + <edge from-layer="3373" from-port="2" to-layer="3418" to-port="2" /> + <edge from-layer="3373" from-port="2" to-layer="7227" to-port="0" /> + <edge from-layer="3374" from-port="0" to-layer="3396" to-port="0" /> + <edge from-layer="3375" from-port="0" to-layer="3390" to-port="0" /> + <edge from-layer="3376" from-port="0" to-layer="3394" to-port="1" /> + <edge from-layer="3376" from-port="0" to-layer="3390" to-port="1" /> + <edge from-layer="3377" from-port="1" to-layer="3380" to-port="0" /> + <edge from-layer="3378" from-port="0" to-layer="3380" to-port="1" /> + <edge from-layer="3379" from-port="0" to-layer="3380" to-port="2" /> + <edge from-layer="3380" from-port="3" to-layer="3381" to-port="1" /> + <edge from-layer="3381" from-port="2" to-layer="3393" to-port="0" /> + <edge from-layer="3381" from-port="2" to-layer="3386" to-port="0" /> + <edge from-layer="3382" from-port="1" to-layer="3411" to-port="0" /> + <edge from-layer="3382" from-port="1" to-layer="3385" to-port="0" /> + <edge from-layer="3383" from-port="0" to-layer="3385" to-port="1" /> + <edge from-layer="3384" from-port="0" to-layer="3385" to-port="2" /> + <edge from-layer="3385" from-port="3" to-layer="3386" to-port="1" /> + <edge from-layer="3386" from-port="2" to-layer="3388" to-port="0" /> + <edge from-layer="3387" from-port="0" to-layer="3388" to-port="1" /> + <edge from-layer="3388" from-port="2" to-layer="3390" to-port="2" /> + <edge from-layer="3389" from-port="0" to-layer="3394" to-port="3" /> + <edge from-layer="3389" from-port="0" to-layer="3390" to-port="3" /> + <edge from-layer="3390" from-port="4" to-layer="3396" to-port="1" /> + <edge from-layer="3391" from-port="0" to-layer="3394" to-port="0" /> + <edge from-layer="3392" from-port="0" to-layer="3393" to-port="1" /> + <edge from-layer="3393" from-port="2" to-layer="3394" to-port="2" /> + <edge from-layer="3393" from-port="2" to-layer="3401" to-port="2" /> + <edge from-layer="3394" from-port="4" to-layer="3396" to-port="2" /> + <edge from-layer="3395" from-port="0" to-layer="3396" to-port="3" /> + <edge from-layer="3396" from-port="4" to-layer="3403" to-port="0" /> + <edge from-layer="3397" from-port="0" to-layer="3403" to-port="1" /> + <edge from-layer="3398" from-port="0" to-layer="3401" to-port="0" /> + <edge from-layer="3399" from-port="0" to-layer="3401" to-port="1" /> + <edge from-layer="3400" from-port="0" to-layer="3401" to-port="3" /> + <edge from-layer="3401" from-port="4" to-layer="3403" to-port="2" /> + <edge from-layer="3402" from-port="0" to-layer="3403" to-port="3" /> + <edge from-layer="3403" from-port="4" to-layer="3406" to-port="0" /> + <edge from-layer="3404" from-port="0" to-layer="3406" to-port="1" /> + <edge from-layer="3405" from-port="0" to-layer="3406" to-port="2" /> + <edge from-layer="3406" from-port="3" to-layer="3407" to-port="0" /> + <edge from-layer="3407" from-port="2" to-layer="3408" to-port="0" /> + <edge from-layer="3407" from-port="2" to-layer="3417" to-port="0" /> + <edge from-layer="3408" from-port="1" to-layer="3416" to-port="0" /> + <edge from-layer="3409" from-port="0" to-layer="3411" to-port="1" /> + <edge from-layer="3410" from-port="0" to-layer="3411" to-port="2" /> + <edge from-layer="3411" from-port="3" to-layer="3415" to-port="0" /> + <edge from-layer="3412" from-port="0" to-layer="3415" to-port="1" /> + <edge from-layer="3413" from-port="0" to-layer="3415" to-port="2" /> + <edge from-layer="3414" from-port="0" to-layer="3415" to-port="3" /> + <edge from-layer="3415" from-port="4" to-layer="3416" to-port="1" /> + <edge from-layer="3416" from-port="2" to-layer="3417" to-port="1" /> + <edge from-layer="3417" from-port="2" to-layer="3418" to-port="3" /> + <edge from-layer="3418" from-port="4" to-layer="3420" to-port="0" /> + <edge from-layer="3419" from-port="0" to-layer="3420" to-port="1" /> + <edge from-layer="3420" from-port="2" to-layer="3422" to-port="0" /> + <edge from-layer="3421" from-port="0" to-layer="3422" to-port="1" /> + <edge from-layer="3422" from-port="2" to-layer="3431" to-port="0" /> + <edge from-layer="3423" from-port="0" to-layer="3424" to-port="0" /> + <edge from-layer="3424" from-port="1" to-layer="3427" to-port="0" /> + <edge from-layer="3425" from-port="0" to-layer="3426" to-port="0" /> + <edge from-layer="3426" from-port="1" to-layer="3427" to-port="1" /> + <edge from-layer="3427" from-port="2" to-layer="3429" to-port="0" /> + <edge from-layer="3428" from-port="0" to-layer="3429" to-port="1" /> + <edge from-layer="3429" from-port="2" to-layer="3430" to-port="0" /> + <edge from-layer="3430" from-port="1" to-layer="3431" to-port="1" /> + <edge from-layer="3431" from-port="2" to-layer="3433" to-port="0" /> + <edge from-layer="3432" from-port="0" to-layer="3433" to-port="1" /> + <edge from-layer="3433" from-port="2" to-layer="3434" to-port="0" /> + <edge from-layer="3434" from-port="2" to-layer="3464" to-port="1" /> + <edge from-layer="3434" from-port="2" to-layer="3436" to-port="0" /> + <edge from-layer="3435" from-port="0" to-layer="3436" to-port="1" /> + <edge from-layer="3436" from-port="2" to-layer="3438" to-port="0" /> + <edge from-layer="3437" from-port="0" to-layer="3438" to-port="1" /> + <edge from-layer="3438" from-port="2" to-layer="3440" to-port="0" /> + <edge from-layer="3439" from-port="0" to-layer="3440" to-port="1" /> + <edge from-layer="3440" from-port="2" to-layer="3449" to-port="0" /> + <edge from-layer="3441" from-port="0" to-layer="3442" to-port="0" /> + <edge from-layer="3442" from-port="1" to-layer="3445" to-port="0" /> + <edge from-layer="3443" from-port="0" to-layer="3444" to-port="0" /> + <edge from-layer="3444" from-port="1" to-layer="3445" to-port="1" /> + <edge from-layer="3445" from-port="2" to-layer="3447" to-port="0" /> + <edge from-layer="3446" from-port="0" to-layer="3447" to-port="1" /> + <edge from-layer="3447" from-port="2" to-layer="3448" to-port="0" /> + <edge from-layer="3448" from-port="1" to-layer="3449" to-port="1" /> + <edge from-layer="3449" from-port="2" to-layer="3451" to-port="0" /> + <edge from-layer="3450" from-port="0" to-layer="3451" to-port="1" /> + <edge from-layer="3451" from-port="2" to-layer="3452" to-port="0" /> + <edge from-layer="3452" from-port="1" to-layer="3461" to-port="0" /> + <edge from-layer="3453" from-port="0" to-layer="3454" to-port="0" /> + <edge from-layer="3454" from-port="1" to-layer="3457" to-port="0" /> + <edge from-layer="3455" from-port="0" to-layer="3456" to-port="0" /> + <edge from-layer="3456" from-port="1" to-layer="3457" to-port="1" /> + <edge from-layer="3457" from-port="2" to-layer="3459" to-port="0" /> + <edge from-layer="3458" from-port="0" to-layer="3459" to-port="1" /> + <edge from-layer="3459" from-port="2" to-layer="3460" to-port="0" /> + <edge from-layer="3460" from-port="1" to-layer="3461" to-port="1" /> + <edge from-layer="3461" from-port="2" to-layer="3463" to-port="0" /> + <edge from-layer="3462" from-port="0" to-layer="3463" to-port="1" /> + <edge from-layer="3463" from-port="2" to-layer="3464" to-port="0" /> + <edge from-layer="3464" from-port="2" to-layer="3661" to-port="1" /> + <edge from-layer="3464" from-port="2" to-layer="3466" to-port="0" /> + <edge from-layer="3465" from-port="0" to-layer="3466" to-port="1" /> + <edge from-layer="3466" from-port="2" to-layer="3468" to-port="0" /> + <edge from-layer="3467" from-port="0" to-layer="3468" to-port="1" /> + <edge from-layer="3468" from-port="2" to-layer="3470" to-port="0" /> + <edge from-layer="3469" from-port="0" to-layer="3470" to-port="1" /> + <edge from-layer="3470" from-port="2" to-layer="3479" to-port="0" /> + <edge from-layer="3471" from-port="0" to-layer="3472" to-port="0" /> + <edge from-layer="3472" from-port="1" to-layer="3475" to-port="0" /> + <edge from-layer="3473" from-port="0" to-layer="3474" to-port="0" /> + <edge from-layer="3474" from-port="1" to-layer="3475" to-port="1" /> + <edge from-layer="3475" from-port="2" to-layer="3477" to-port="0" /> + <edge from-layer="3476" from-port="0" to-layer="3477" to-port="1" /> + <edge from-layer="3477" from-port="2" to-layer="3478" to-port="0" /> + <edge from-layer="3478" from-port="1" to-layer="3479" to-port="1" /> + <edge from-layer="3479" from-port="2" to-layer="3481" to-port="0" /> + <edge from-layer="3480" from-port="0" to-layer="3481" to-port="1" /> + <edge from-layer="3481" from-port="2" to-layer="3483" to-port="0" /> + <edge from-layer="3482" from-port="0" to-layer="3483" to-port="1" /> + <edge from-layer="3483" from-port="2" to-layer="3487" to-port="0" /> + <edge from-layer="3483" from-port="2" to-layer="3597" to-port="0" /> + <edge from-layer="3483" from-port="2" to-layer="3499" to-port="0" /> + <edge from-layer="3484" from-port="0" to-layer="3487" to-port="1" /> + <edge from-layer="3485" from-port="0" to-layer="3487" to-port="2" /> + <edge from-layer="3486" from-port="0" to-layer="3487" to-port="3" /> + <edge from-layer="3487" from-port="4" to-layer="3489" to-port="0" /> + <edge from-layer="3488" from-port="0" to-layer="3489" to-port="1" /> + <edge from-layer="3489" from-port="2" to-layer="3493" to-port="0" /> + <edge from-layer="3490" from-port="0" to-layer="3493" to-port="1" /> + <edge from-layer="3491" from-port="0" to-layer="3493" to-port="2" /> + <edge from-layer="3492" from-port="0" to-layer="3493" to-port="3" /> + <edge from-layer="3493" from-port="4" to-layer="3525" to-port="0" /> + <edge from-layer="3493" from-port="4" to-layer="3528" to-port="0" /> + <edge from-layer="3493" from-port="4" to-layer="3539" to-port="0" /> + <edge from-layer="3493" from-port="4" to-layer="3544" to-port="0" /> + <edge from-layer="3494" from-port="0" to-layer="3521" to-port="0" /> + <edge from-layer="3495" from-port="0" to-layer="3521" to-port="1" /> + <edge from-layer="3496" from-port="0" to-layer="3499" to-port="1" /> + <edge from-layer="3497" from-port="0" to-layer="3499" to-port="2" /> + <edge from-layer="3498" from-port="0" to-layer="3499" to-port="3" /> + <edge from-layer="3499" from-port="4" to-layer="3500" to-port="0" /> + <edge from-layer="3499" from-port="4" to-layer="3556" to-port="0" /> + <edge from-layer="3500" from-port="1" to-layer="3503" to-port="0" /> + <edge from-layer="3501" from-port="0" to-layer="3503" to-port="1" /> + <edge from-layer="3502" from-port="0" to-layer="3503" to-port="2" /> + <edge from-layer="3503" from-port="3" to-layer="3519" to-port="0" /> + <edge from-layer="3504" from-port="0" to-layer="3509" to-port="0" /> + <edge from-layer="3505" from-port="0" to-layer="3508" to-port="1" /> + <edge from-layer="3506" from-port="0" to-layer="3508" to-port="2" /> + <edge from-layer="3507" from-port="0" to-layer="3508" to-port="3" /> + <edge from-layer="3508" from-port="4" to-layer="3509" to-port="1" /> + <edge from-layer="3509" from-port="2" to-layer="3510" to-port="0" /> + <edge from-layer="3510" from-port="1" to-layer="3512" to-port="0" /> + <edge from-layer="3511" from-port="0" to-layer="3512" to-port="2" /> + <edge from-layer="3512" from-port="3" to-layer="3513" to-port="0" /> + <edge from-layer="3512" from-port="3" to-layer="3584" to-port="0" /> + <edge from-layer="3513" from-port="1" to-layer="3516" to-port="0" /> + <edge from-layer="3514" from-port="0" to-layer="3516" to-port="1" /> + <edge from-layer="3515" from-port="0" to-layer="3516" to-port="2" /> + <edge from-layer="3516" from-port="3" to-layer="3608" to-port="0" /> + <edge from-layer="3516" from-port="3" to-layer="3518" to-port="0" /> + <edge from-layer="3517" from-port="0" to-layer="3518" to-port="1" /> + <edge from-layer="3518" from-port="2" to-layer="3519" to-port="1" /> + <edge from-layer="3519" from-port="2" to-layer="3549" to-port="2" /> + <edge from-layer="3519" from-port="2" to-layer="3521" to-port="2" /> + <edge from-layer="3520" from-port="0" to-layer="3521" to-port="3" /> + <edge from-layer="3521" from-port="4" to-layer="3523" to-port="0" /> + <edge from-layer="3522" from-port="0" to-layer="3523" to-port="2" /> + <edge from-layer="3523" from-port="3" to-layer="3524" to-port="0" /> + <edge from-layer="3524" from-port="2" to-layer="3525" to-port="1" /> + <edge from-layer="3524" from-port="2" to-layer="3561" to-port="1" /> + <edge from-layer="3525" from-port="2" to-layer="3554" to-port="0" /> + <edge from-layer="3526" from-port="0" to-layer="3536" to-port="0" /> + <edge from-layer="3527" from-port="0" to-layer="3536" to-port="1" /> + <edge from-layer="3528" from-port="1" to-layer="3530" to-port="0" /> + <edge from-layer="3529" from-port="0" to-layer="3530" to-port="2" /> + <edge from-layer="3530" from-port="3" to-layer="3531" to-port="0" /> + <edge from-layer="3531" from-port="2" to-layer="3532" to-port="0" /> + <edge from-layer="3532" from-port="1" to-layer="3534" to-port="0" /> + <edge from-layer="3533" from-port="0" to-layer="3534" to-port="1" /> + <edge from-layer="3534" from-port="2" to-layer="3536" to-port="2" /> + <edge from-layer="3535" from-port="0" to-layer="3536" to-port="3" /> + <edge from-layer="3536" from-port="4" to-layer="3539" to-port="1" /> + <edge from-layer="3536" from-port="4" to-layer="3544" to-port="2" /> + <edge from-layer="3537" from-port="0" to-layer="3539" to-port="2" /> + <edge from-layer="3538" from-port="0" to-layer="3539" to-port="3" /> + <edge from-layer="3539" from-port="4" to-layer="3541" to-port="0" /> + <edge from-layer="3540" from-port="0" to-layer="3541" to-port="1" /> + <edge from-layer="3541" from-port="2" to-layer="3545" to-port="0" /> + <edge from-layer="3542" from-port="0" to-layer="3544" to-port="1" /> + <edge from-layer="3543" from-port="0" to-layer="3544" to-port="3" /> + <edge from-layer="3544" from-port="4" to-layer="3545" to-port="1" /> + <edge from-layer="3545" from-port="2" to-layer="3553" to-port="0" /> + <edge from-layer="3546" from-port="0" to-layer="3549" to-port="0" /> + <edge from-layer="3547" from-port="0" to-layer="3549" to-port="1" /> + <edge from-layer="3548" from-port="0" to-layer="3549" to-port="3" /> + <edge from-layer="3549" from-port="4" to-layer="3551" to-port="0" /> + <edge from-layer="3550" from-port="0" to-layer="3551" to-port="2" /> + <edge from-layer="3551" from-port="3" to-layer="3552" to-port="0" /> + <edge from-layer="3552" from-port="2" to-layer="3553" to-port="1" /> + <edge from-layer="3552" from-port="2" to-layer="3582" to-port="1" /> + <edge from-layer="3553" from-port="2" to-layer="3554" to-port="1" /> + <edge from-layer="3554" from-port="2" to-layer="3645" to-port="0" /> + <edge from-layer="3554" from-port="2" to-layer="3609" to-port="0" /> + <edge from-layer="3555" from-port="0" to-layer="3556" to-port="1" /> + <edge from-layer="3556" from-port="2" to-layer="3560" to-port="0" /> + <edge from-layer="3557" from-port="0" to-layer="3560" to-port="1" /> + <edge from-layer="3558" from-port="0" to-layer="3560" to-port="2" /> + <edge from-layer="3559" from-port="0" to-layer="3560" to-port="3" /> + <edge from-layer="3560" from-port="4" to-layer="3575" to-port="0" /> + <edge from-layer="3560" from-port="4" to-layer="3580" to-port="0" /> + <edge from-layer="3560" from-port="4" to-layer="3561" to-port="0" /> + <edge from-layer="3560" from-port="4" to-layer="3564" to-port="0" /> + <edge from-layer="3561" from-port="2" to-layer="3583" to-port="0" /> + <edge from-layer="3562" from-port="0" to-layer="3572" to-port="0" /> + <edge from-layer="3563" from-port="0" to-layer="3572" to-port="1" /> + <edge from-layer="3564" from-port="1" to-layer="3566" to-port="0" /> + <edge from-layer="3565" from-port="0" to-layer="3566" to-port="2" /> + <edge from-layer="3566" from-port="3" to-layer="3567" to-port="0" /> + <edge from-layer="3567" from-port="2" to-layer="3568" to-port="0" /> + <edge from-layer="3568" from-port="1" to-layer="3570" to-port="0" /> + <edge from-layer="3569" from-port="0" to-layer="3570" to-port="1" /> + <edge from-layer="3570" from-port="2" to-layer="3572" to-port="2" /> + <edge from-layer="3571" from-port="0" to-layer="3572" to-port="3" /> + <edge from-layer="3572" from-port="4" to-layer="3575" to-port="1" /> + <edge from-layer="3572" from-port="4" to-layer="3580" to-port="2" /> + <edge from-layer="3573" from-port="0" to-layer="3575" to-port="2" /> + <edge from-layer="3574" from-port="0" to-layer="3575" to-port="3" /> + <edge from-layer="3575" from-port="4" to-layer="3577" to-port="0" /> + <edge from-layer="3576" from-port="0" to-layer="3577" to-port="1" /> + <edge from-layer="3577" from-port="2" to-layer="3581" to-port="0" /> + <edge from-layer="3578" from-port="0" to-layer="3580" to-port="1" /> + <edge from-layer="3579" from-port="0" to-layer="3580" to-port="3" /> + <edge from-layer="3580" from-port="4" to-layer="3581" to-port="1" /> + <edge from-layer="3581" from-port="2" to-layer="3582" to-port="0" /> + <edge from-layer="3582" from-port="2" to-layer="3583" to-port="1" /> + <edge from-layer="3583" from-port="2" to-layer="3604" to-port="0" /> + <edge from-layer="3583" from-port="2" to-layer="3584" to-port="1" /> + <edge from-layer="3584" from-port="2" to-layer="3645" to-port="1" /> + <edge from-layer="3584" from-port="2" to-layer="7226" to-port="0" /> + <edge from-layer="3585" from-port="0" to-layer="3590" to-port="0" /> + <edge from-layer="3586" from-port="0" to-layer="3589" to-port="1" /> + <edge from-layer="3587" from-port="0" to-layer="3589" to-port="2" /> + <edge from-layer="3588" from-port="0" to-layer="3589" to-port="3" /> + <edge from-layer="3589" from-port="4" to-layer="3590" to-port="1" /> + <edge from-layer="3590" from-port="2" to-layer="3591" to-port="0" /> + <edge from-layer="3591" from-port="1" to-layer="3593" to-port="0" /> + <edge from-layer="3592" from-port="0" to-layer="3593" to-port="2" /> + <edge from-layer="3593" from-port="3" to-layer="3600" to-port="0" /> + <edge from-layer="3594" from-port="0" to-layer="3597" to-port="1" /> + <edge from-layer="3595" from-port="0" to-layer="3597" to-port="2" /> + <edge from-layer="3596" from-port="0" to-layer="3597" to-port="3" /> + <edge from-layer="3597" from-port="4" to-layer="3599" to-port="0" /> + <edge from-layer="3598" from-port="0" to-layer="3599" to-port="1" /> + <edge from-layer="3599" from-port="2" to-layer="3600" to-port="1" /> + <edge from-layer="3600" from-port="2" to-layer="7225" to-port="0" /> + <edge from-layer="3600" from-port="2" to-layer="3645" to-port="2" /> + <edge from-layer="3601" from-port="0" to-layer="3623" to-port="0" /> + <edge from-layer="3602" from-port="0" to-layer="3617" to-port="0" /> + <edge from-layer="3603" from-port="0" to-layer="3621" to-port="1" /> + <edge from-layer="3603" from-port="0" to-layer="3617" to-port="1" /> + <edge from-layer="3604" from-port="1" to-layer="3607" to-port="0" /> + <edge from-layer="3605" from-port="0" to-layer="3607" to-port="1" /> + <edge from-layer="3606" from-port="0" to-layer="3607" to-port="2" /> + <edge from-layer="3607" from-port="3" to-layer="3608" to-port="1" /> + <edge from-layer="3608" from-port="2" to-layer="3613" to-port="0" /> + <edge from-layer="3608" from-port="2" to-layer="3620" to-port="0" /> + <edge from-layer="3609" from-port="1" to-layer="3612" to-port="0" /> + <edge from-layer="3609" from-port="1" to-layer="3638" to-port="0" /> + <edge from-layer="3610" from-port="0" to-layer="3612" to-port="1" /> + <edge from-layer="3611" from-port="0" to-layer="3612" to-port="2" /> + <edge from-layer="3612" from-port="3" to-layer="3613" to-port="1" /> + <edge from-layer="3613" from-port="2" to-layer="3615" to-port="0" /> + <edge from-layer="3614" from-port="0" to-layer="3615" to-port="1" /> + <edge from-layer="3615" from-port="2" to-layer="3617" to-port="2" /> + <edge from-layer="3616" from-port="0" to-layer="3617" to-port="3" /> + <edge from-layer="3616" from-port="0" to-layer="3621" to-port="3" /> + <edge from-layer="3617" from-port="4" to-layer="3623" to-port="1" /> + <edge from-layer="3618" from-port="0" to-layer="3621" to-port="0" /> + <edge from-layer="3619" from-port="0" to-layer="3620" to-port="1" /> + <edge from-layer="3620" from-port="2" to-layer="3628" to-port="2" /> + <edge from-layer="3620" from-port="2" to-layer="3621" to-port="2" /> + <edge from-layer="3621" from-port="4" to-layer="3623" to-port="2" /> + <edge from-layer="3622" from-port="0" to-layer="3623" to-port="3" /> + <edge from-layer="3623" from-port="4" to-layer="3630" to-port="0" /> + <edge from-layer="3624" from-port="0" to-layer="3630" to-port="1" /> + <edge from-layer="3625" from-port="0" to-layer="3628" to-port="0" /> + <edge from-layer="3626" from-port="0" to-layer="3628" to-port="1" /> + <edge from-layer="3627" from-port="0" to-layer="3628" to-port="3" /> + <edge from-layer="3628" from-port="4" to-layer="3630" to-port="2" /> + <edge from-layer="3629" from-port="0" to-layer="3630" to-port="3" /> + <edge from-layer="3630" from-port="4" to-layer="3633" to-port="0" /> + <edge from-layer="3631" from-port="0" to-layer="3633" to-port="1" /> + <edge from-layer="3632" from-port="0" to-layer="3633" to-port="2" /> + <edge from-layer="3633" from-port="3" to-layer="3634" to-port="0" /> + <edge from-layer="3634" from-port="2" to-layer="3635" to-port="0" /> + <edge from-layer="3634" from-port="2" to-layer="3644" to-port="0" /> + <edge from-layer="3635" from-port="1" to-layer="3643" to-port="0" /> + <edge from-layer="3636" from-port="0" to-layer="3638" to-port="1" /> + <edge from-layer="3637" from-port="0" to-layer="3638" to-port="2" /> + <edge from-layer="3638" from-port="3" to-layer="3642" to-port="0" /> + <edge from-layer="3639" from-port="0" to-layer="3642" to-port="1" /> + <edge from-layer="3640" from-port="0" to-layer="3642" to-port="2" /> + <edge from-layer="3641" from-port="0" to-layer="3642" to-port="3" /> + <edge from-layer="3642" from-port="4" to-layer="3643" to-port="1" /> + <edge from-layer="3643" from-port="2" to-layer="3644" to-port="1" /> + <edge from-layer="3644" from-port="2" to-layer="3645" to-port="3" /> + <edge from-layer="3645" from-port="4" to-layer="3647" to-port="0" /> + <edge from-layer="3646" from-port="0" to-layer="3647" to-port="1" /> + <edge from-layer="3647" from-port="2" to-layer="3649" to-port="0" /> + <edge from-layer="3648" from-port="0" to-layer="3649" to-port="1" /> + <edge from-layer="3649" from-port="2" to-layer="3658" to-port="0" /> + <edge from-layer="3650" from-port="0" to-layer="3651" to-port="0" /> + <edge from-layer="3651" from-port="1" to-layer="3654" to-port="0" /> + <edge from-layer="3652" from-port="0" to-layer="3653" to-port="0" /> + <edge from-layer="3653" from-port="1" to-layer="3654" to-port="1" /> + <edge from-layer="3654" from-port="2" to-layer="3656" to-port="0" /> + <edge from-layer="3655" from-port="0" to-layer="3656" to-port="1" /> + <edge from-layer="3656" from-port="2" to-layer="3657" to-port="0" /> + <edge from-layer="3657" from-port="1" to-layer="3658" to-port="1" /> + <edge from-layer="3658" from-port="2" to-layer="3660" to-port="0" /> + <edge from-layer="3659" from-port="0" to-layer="3660" to-port="1" /> + <edge from-layer="3660" from-port="2" to-layer="3661" to-port="0" /> + <edge from-layer="3661" from-port="2" to-layer="3691" to-port="1" /> + <edge from-layer="3661" from-port="2" to-layer="3663" to-port="0" /> + <edge from-layer="3662" from-port="0" to-layer="3663" to-port="1" /> + <edge from-layer="3663" from-port="2" to-layer="3665" to-port="0" /> + <edge from-layer="3664" from-port="0" to-layer="3665" to-port="1" /> + <edge from-layer="3665" from-port="2" to-layer="3667" to-port="0" /> + <edge from-layer="3666" from-port="0" to-layer="3667" to-port="1" /> + <edge from-layer="3667" from-port="2" to-layer="3676" to-port="0" /> + <edge from-layer="3668" from-port="0" to-layer="3669" to-port="0" /> + <edge from-layer="3669" from-port="1" to-layer="3672" to-port="0" /> + <edge from-layer="3670" from-port="0" to-layer="3671" to-port="0" /> + <edge from-layer="3671" from-port="1" to-layer="3672" to-port="1" /> + <edge from-layer="3672" from-port="2" to-layer="3674" to-port="0" /> + <edge from-layer="3673" from-port="0" to-layer="3674" to-port="1" /> + <edge from-layer="3674" from-port="2" to-layer="3675" to-port="0" /> + <edge from-layer="3675" from-port="1" to-layer="3676" to-port="1" /> + <edge from-layer="3676" from-port="2" to-layer="3678" to-port="0" /> + <edge from-layer="3677" from-port="0" to-layer="3678" to-port="1" /> + <edge from-layer="3678" from-port="2" to-layer="3679" to-port="0" /> + <edge from-layer="3679" from-port="1" to-layer="3688" to-port="0" /> + <edge from-layer="3680" from-port="0" to-layer="3681" to-port="0" /> + <edge from-layer="3681" from-port="1" to-layer="3684" to-port="0" /> + <edge from-layer="3682" from-port="0" to-layer="3683" to-port="0" /> + <edge from-layer="3683" from-port="1" to-layer="3684" to-port="1" /> + <edge from-layer="3684" from-port="2" to-layer="3686" to-port="0" /> + <edge from-layer="3685" from-port="0" to-layer="3686" to-port="1" /> + <edge from-layer="3686" from-port="2" to-layer="3687" to-port="0" /> + <edge from-layer="3687" from-port="1" to-layer="3688" to-port="1" /> + <edge from-layer="3688" from-port="2" to-layer="3690" to-port="0" /> + <edge from-layer="3689" from-port="0" to-layer="3690" to-port="1" /> + <edge from-layer="3690" from-port="2" to-layer="3691" to-port="0" /> + <edge from-layer="3691" from-port="2" to-layer="3888" to-port="1" /> + <edge from-layer="3691" from-port="2" to-layer="3693" to-port="0" /> + <edge from-layer="3692" from-port="0" to-layer="3693" to-port="1" /> + <edge from-layer="3693" from-port="2" to-layer="3695" to-port="0" /> + <edge from-layer="3694" from-port="0" to-layer="3695" to-port="1" /> + <edge from-layer="3695" from-port="2" to-layer="3697" to-port="0" /> + <edge from-layer="3696" from-port="0" to-layer="3697" to-port="1" /> + <edge from-layer="3697" from-port="2" to-layer="3706" to-port="0" /> + <edge from-layer="3698" from-port="0" to-layer="3699" to-port="0" /> + <edge from-layer="3699" from-port="1" to-layer="3702" to-port="0" /> + <edge from-layer="3700" from-port="0" to-layer="3701" to-port="0" /> + <edge from-layer="3701" from-port="1" to-layer="3702" to-port="1" /> + <edge from-layer="3702" from-port="2" to-layer="3704" to-port="0" /> + <edge from-layer="3703" from-port="0" to-layer="3704" to-port="1" /> + <edge from-layer="3704" from-port="2" to-layer="3705" to-port="0" /> + <edge from-layer="3705" from-port="1" to-layer="3706" to-port="1" /> + <edge from-layer="3706" from-port="2" to-layer="3708" to-port="0" /> + <edge from-layer="3707" from-port="0" to-layer="3708" to-port="1" /> + <edge from-layer="3708" from-port="2" to-layer="3710" to-port="0" /> + <edge from-layer="3709" from-port="0" to-layer="3710" to-port="1" /> + <edge from-layer="3710" from-port="2" to-layer="3824" to-port="0" /> + <edge from-layer="3710" from-port="2" to-layer="3726" to-port="0" /> + <edge from-layer="3710" from-port="2" to-layer="3714" to-port="0" /> + <edge from-layer="3711" from-port="0" to-layer="3714" to-port="1" /> + <edge from-layer="3712" from-port="0" to-layer="3714" to-port="2" /> + <edge from-layer="3713" from-port="0" to-layer="3714" to-port="3" /> + <edge from-layer="3714" from-port="4" to-layer="3716" to-port="0" /> + <edge from-layer="3715" from-port="0" to-layer="3716" to-port="1" /> + <edge from-layer="3716" from-port="2" to-layer="3720" to-port="0" /> + <edge from-layer="3717" from-port="0" to-layer="3720" to-port="1" /> + <edge from-layer="3718" from-port="0" to-layer="3720" to-port="2" /> + <edge from-layer="3719" from-port="0" to-layer="3720" to-port="3" /> + <edge from-layer="3720" from-port="4" to-layer="3752" to-port="0" /> + <edge from-layer="3720" from-port="4" to-layer="3771" to-port="0" /> + <edge from-layer="3720" from-port="4" to-layer="3755" to-port="0" /> + <edge from-layer="3720" from-port="4" to-layer="3766" to-port="0" /> + <edge from-layer="3721" from-port="0" to-layer="3748" to-port="0" /> + <edge from-layer="3722" from-port="0" to-layer="3748" to-port="1" /> + <edge from-layer="3723" from-port="0" to-layer="3726" to-port="1" /> + <edge from-layer="3724" from-port="0" to-layer="3726" to-port="2" /> + <edge from-layer="3725" from-port="0" to-layer="3726" to-port="3" /> + <edge from-layer="3726" from-port="4" to-layer="3783" to-port="0" /> + <edge from-layer="3726" from-port="4" to-layer="3727" to-port="0" /> + <edge from-layer="3727" from-port="1" to-layer="3730" to-port="0" /> + <edge from-layer="3728" from-port="0" to-layer="3730" to-port="1" /> + <edge from-layer="3729" from-port="0" to-layer="3730" to-port="2" /> + <edge from-layer="3730" from-port="3" to-layer="3746" to-port="0" /> + <edge from-layer="3731" from-port="0" to-layer="3736" to-port="0" /> + <edge from-layer="3732" from-port="0" to-layer="3735" to-port="1" /> + <edge from-layer="3733" from-port="0" to-layer="3735" to-port="2" /> + <edge from-layer="3734" from-port="0" to-layer="3735" to-port="3" /> + <edge from-layer="3735" from-port="4" to-layer="3736" to-port="1" /> + <edge from-layer="3736" from-port="2" to-layer="3737" to-port="0" /> + <edge from-layer="3737" from-port="1" to-layer="3739" to-port="0" /> + <edge from-layer="3738" from-port="0" to-layer="3739" to-port="2" /> + <edge from-layer="3739" from-port="3" to-layer="3740" to-port="0" /> + <edge from-layer="3739" from-port="3" to-layer="3811" to-port="0" /> + <edge from-layer="3740" from-port="1" to-layer="3743" to-port="0" /> + <edge from-layer="3741" from-port="0" to-layer="3743" to-port="1" /> + <edge from-layer="3742" from-port="0" to-layer="3743" to-port="2" /> + <edge from-layer="3743" from-port="3" to-layer="3745" to-port="0" /> + <edge from-layer="3743" from-port="3" to-layer="3835" to-port="0" /> + <edge from-layer="3744" from-port="0" to-layer="3745" to-port="1" /> + <edge from-layer="3745" from-port="2" to-layer="3746" to-port="1" /> + <edge from-layer="3746" from-port="2" to-layer="3748" to-port="2" /> + <edge from-layer="3746" from-port="2" to-layer="3776" to-port="2" /> + <edge from-layer="3747" from-port="0" to-layer="3748" to-port="3" /> + <edge from-layer="3748" from-port="4" to-layer="3750" to-port="0" /> + <edge from-layer="3749" from-port="0" to-layer="3750" to-port="2" /> + <edge from-layer="3750" from-port="3" to-layer="3751" to-port="0" /> + <edge from-layer="3751" from-port="2" to-layer="3788" to-port="1" /> + <edge from-layer="3751" from-port="2" to-layer="3752" to-port="1" /> + <edge from-layer="3752" from-port="2" to-layer="3781" to-port="0" /> + <edge from-layer="3753" from-port="0" to-layer="3763" to-port="0" /> + <edge from-layer="3754" from-port="0" to-layer="3763" to-port="1" /> + <edge from-layer="3755" from-port="1" to-layer="3757" to-port="0" /> + <edge from-layer="3756" from-port="0" to-layer="3757" to-port="2" /> + <edge from-layer="3757" from-port="3" to-layer="3758" to-port="0" /> + <edge from-layer="3758" from-port="2" to-layer="3759" to-port="0" /> + <edge from-layer="3759" from-port="1" to-layer="3761" to-port="0" /> + <edge from-layer="3760" from-port="0" to-layer="3761" to-port="1" /> + <edge from-layer="3761" from-port="2" to-layer="3763" to-port="2" /> + <edge from-layer="3762" from-port="0" to-layer="3763" to-port="3" /> + <edge from-layer="3763" from-port="4" to-layer="3766" to-port="1" /> + <edge from-layer="3763" from-port="4" to-layer="3771" to-port="2" /> + <edge from-layer="3764" from-port="0" to-layer="3766" to-port="2" /> + <edge from-layer="3765" from-port="0" to-layer="3766" to-port="3" /> + <edge from-layer="3766" from-port="4" to-layer="3768" to-port="0" /> + <edge from-layer="3767" from-port="0" to-layer="3768" to-port="1" /> + <edge from-layer="3768" from-port="2" to-layer="3772" to-port="0" /> + <edge from-layer="3769" from-port="0" to-layer="3771" to-port="1" /> + <edge from-layer="3770" from-port="0" to-layer="3771" to-port="3" /> + <edge from-layer="3771" from-port="4" to-layer="3772" to-port="1" /> + <edge from-layer="3772" from-port="2" to-layer="3780" to-port="0" /> + <edge from-layer="3773" from-port="0" to-layer="3776" to-port="0" /> + <edge from-layer="3774" from-port="0" to-layer="3776" to-port="1" /> + <edge from-layer="3775" from-port="0" to-layer="3776" to-port="3" /> + <edge from-layer="3776" from-port="4" to-layer="3778" to-port="0" /> + <edge from-layer="3777" from-port="0" to-layer="3778" to-port="2" /> + <edge from-layer="3778" from-port="3" to-layer="3779" to-port="0" /> + <edge from-layer="3779" from-port="2" to-layer="3780" to-port="1" /> + <edge from-layer="3779" from-port="2" to-layer="3809" to-port="1" /> + <edge from-layer="3780" from-port="2" to-layer="3781" to-port="1" /> + <edge from-layer="3781" from-port="2" to-layer="3872" to-port="0" /> + <edge from-layer="3781" from-port="2" to-layer="3836" to-port="0" /> + <edge from-layer="3782" from-port="0" to-layer="3783" to-port="1" /> + <edge from-layer="3783" from-port="2" to-layer="3787" to-port="0" /> + <edge from-layer="3784" from-port="0" to-layer="3787" to-port="1" /> + <edge from-layer="3785" from-port="0" to-layer="3787" to-port="2" /> + <edge from-layer="3786" from-port="0" to-layer="3787" to-port="3" /> + <edge from-layer="3787" from-port="4" to-layer="3807" to-port="0" /> + <edge from-layer="3787" from-port="4" to-layer="3788" to-port="0" /> + <edge from-layer="3787" from-port="4" to-layer="3791" to-port="0" /> + <edge from-layer="3787" from-port="4" to-layer="3802" to-port="0" /> + <edge from-layer="3788" from-port="2" to-layer="3810" to-port="0" /> + <edge from-layer="3789" from-port="0" to-layer="3799" to-port="0" /> + <edge from-layer="3790" from-port="0" to-layer="3799" to-port="1" /> + <edge from-layer="3791" from-port="1" to-layer="3793" to-port="0" /> + <edge from-layer="3792" from-port="0" to-layer="3793" to-port="2" /> + <edge from-layer="3793" from-port="3" to-layer="3794" to-port="0" /> + <edge from-layer="3794" from-port="2" to-layer="3795" to-port="0" /> + <edge from-layer="3795" from-port="1" to-layer="3797" to-port="0" /> + <edge from-layer="3796" from-port="0" to-layer="3797" to-port="1" /> + <edge from-layer="3797" from-port="2" to-layer="3799" to-port="2" /> + <edge from-layer="3798" from-port="0" to-layer="3799" to-port="3" /> + <edge from-layer="3799" from-port="4" to-layer="3802" to-port="1" /> + <edge from-layer="3799" from-port="4" to-layer="3807" to-port="2" /> + <edge from-layer="3800" from-port="0" to-layer="3802" to-port="2" /> + <edge from-layer="3801" from-port="0" to-layer="3802" to-port="3" /> + <edge from-layer="3802" from-port="4" to-layer="3804" to-port="0" /> + <edge from-layer="3803" from-port="0" to-layer="3804" to-port="1" /> + <edge from-layer="3804" from-port="2" to-layer="3808" to-port="0" /> + <edge from-layer="3805" from-port="0" to-layer="3807" to-port="1" /> + <edge from-layer="3806" from-port="0" to-layer="3807" to-port="3" /> + <edge from-layer="3807" from-port="4" to-layer="3808" to-port="1" /> + <edge from-layer="3808" from-port="2" to-layer="3809" to-port="0" /> + <edge from-layer="3809" from-port="2" to-layer="3810" to-port="1" /> + <edge from-layer="3810" from-port="2" to-layer="3831" to-port="0" /> + <edge from-layer="3810" from-port="2" to-layer="3811" to-port="1" /> + <edge from-layer="3811" from-port="2" to-layer="3872" to-port="1" /> + <edge from-layer="3811" from-port="2" to-layer="7224" to-port="0" /> + <edge from-layer="3812" from-port="0" to-layer="3817" to-port="0" /> + <edge from-layer="3813" from-port="0" to-layer="3816" to-port="1" /> + <edge from-layer="3814" from-port="0" to-layer="3816" to-port="2" /> + <edge from-layer="3815" from-port="0" to-layer="3816" to-port="3" /> + <edge from-layer="3816" from-port="4" to-layer="3817" to-port="1" /> + <edge from-layer="3817" from-port="2" to-layer="3818" to-port="0" /> + <edge from-layer="3818" from-port="1" to-layer="3820" to-port="0" /> + <edge from-layer="3819" from-port="0" to-layer="3820" to-port="2" /> + <edge from-layer="3820" from-port="3" to-layer="3827" to-port="0" /> + <edge from-layer="3821" from-port="0" to-layer="3824" to-port="1" /> + <edge from-layer="3822" from-port="0" to-layer="3824" to-port="2" /> + <edge from-layer="3823" from-port="0" to-layer="3824" to-port="3" /> + <edge from-layer="3824" from-port="4" to-layer="3826" to-port="0" /> + <edge from-layer="3825" from-port="0" to-layer="3826" to-port="1" /> + <edge from-layer="3826" from-port="2" to-layer="3827" to-port="1" /> + <edge from-layer="3827" from-port="2" to-layer="3872" to-port="2" /> + <edge from-layer="3827" from-port="2" to-layer="7223" to-port="0" /> + <edge from-layer="3828" from-port="0" to-layer="3850" to-port="0" /> + <edge from-layer="3829" from-port="0" to-layer="3844" to-port="0" /> + <edge from-layer="3830" from-port="0" to-layer="3844" to-port="1" /> + <edge from-layer="3830" from-port="0" to-layer="3848" to-port="1" /> + <edge from-layer="3831" from-port="1" to-layer="3834" to-port="0" /> + <edge from-layer="3832" from-port="0" to-layer="3834" to-port="1" /> + <edge from-layer="3833" from-port="0" to-layer="3834" to-port="2" /> + <edge from-layer="3834" from-port="3" to-layer="3835" to-port="1" /> + <edge from-layer="3835" from-port="2" to-layer="3840" to-port="0" /> + <edge from-layer="3835" from-port="2" to-layer="3847" to-port="0" /> + <edge from-layer="3836" from-port="1" to-layer="3839" to-port="0" /> + <edge from-layer="3836" from-port="1" to-layer="3865" to-port="0" /> + <edge from-layer="3837" from-port="0" to-layer="3839" to-port="1" /> + <edge from-layer="3838" from-port="0" to-layer="3839" to-port="2" /> + <edge from-layer="3839" from-port="3" to-layer="3840" to-port="1" /> + <edge from-layer="3840" from-port="2" to-layer="3842" to-port="0" /> + <edge from-layer="3841" from-port="0" to-layer="3842" to-port="1" /> + <edge from-layer="3842" from-port="2" to-layer="3844" to-port="2" /> + <edge from-layer="3843" from-port="0" to-layer="3848" to-port="3" /> + <edge from-layer="3843" from-port="0" to-layer="3844" to-port="3" /> + <edge from-layer="3844" from-port="4" to-layer="3850" to-port="1" /> + <edge from-layer="3845" from-port="0" to-layer="3848" to-port="0" /> + <edge from-layer="3846" from-port="0" to-layer="3847" to-port="1" /> + <edge from-layer="3847" from-port="2" to-layer="3855" to-port="2" /> + <edge from-layer="3847" from-port="2" to-layer="3848" to-port="2" /> + <edge from-layer="3848" from-port="4" to-layer="3850" to-port="2" /> + <edge from-layer="3849" from-port="0" to-layer="3850" to-port="3" /> + <edge from-layer="3850" from-port="4" to-layer="3857" to-port="0" /> + <edge from-layer="3851" from-port="0" to-layer="3857" to-port="1" /> + <edge from-layer="3852" from-port="0" to-layer="3855" to-port="0" /> + <edge from-layer="3853" from-port="0" to-layer="3855" to-port="1" /> + <edge from-layer="3854" from-port="0" to-layer="3855" to-port="3" /> + <edge from-layer="3855" from-port="4" to-layer="3857" to-port="2" /> + <edge from-layer="3856" from-port="0" to-layer="3857" to-port="3" /> + <edge from-layer="3857" from-port="4" to-layer="3860" to-port="0" /> + <edge from-layer="3858" from-port="0" to-layer="3860" to-port="1" /> + <edge from-layer="3859" from-port="0" to-layer="3860" to-port="2" /> + <edge from-layer="3860" from-port="3" to-layer="3861" to-port="0" /> + <edge from-layer="3861" from-port="2" to-layer="3871" to-port="0" /> + <edge from-layer="3861" from-port="2" to-layer="3862" to-port="0" /> + <edge from-layer="3862" from-port="1" to-layer="3870" to-port="0" /> + <edge from-layer="3863" from-port="0" to-layer="3865" to-port="1" /> + <edge from-layer="3864" from-port="0" to-layer="3865" to-port="2" /> + <edge from-layer="3865" from-port="3" to-layer="3869" to-port="0" /> + <edge from-layer="3866" from-port="0" to-layer="3869" to-port="1" /> + <edge from-layer="3867" from-port="0" to-layer="3869" to-port="2" /> + <edge from-layer="3868" from-port="0" to-layer="3869" to-port="3" /> + <edge from-layer="3869" from-port="4" to-layer="3870" to-port="1" /> + <edge from-layer="3870" from-port="2" to-layer="3871" to-port="1" /> + <edge from-layer="3871" from-port="2" to-layer="3872" to-port="3" /> + <edge from-layer="3872" from-port="4" to-layer="3874" to-port="0" /> + <edge from-layer="3873" from-port="0" to-layer="3874" to-port="1" /> + <edge from-layer="3874" from-port="2" to-layer="3876" to-port="0" /> + <edge from-layer="3875" from-port="0" to-layer="3876" to-port="1" /> + <edge from-layer="3876" from-port="2" to-layer="3885" to-port="0" /> + <edge from-layer="3877" from-port="0" to-layer="3878" to-port="0" /> + <edge from-layer="3878" from-port="1" to-layer="3881" to-port="0" /> + <edge from-layer="3879" from-port="0" to-layer="3880" to-port="0" /> + <edge from-layer="3880" from-port="1" to-layer="3881" to-port="1" /> + <edge from-layer="3881" from-port="2" to-layer="3883" to-port="0" /> + <edge from-layer="3882" from-port="0" to-layer="3883" to-port="1" /> + <edge from-layer="3883" from-port="2" to-layer="3884" to-port="0" /> + <edge from-layer="3884" from-port="1" to-layer="3885" to-port="1" /> + <edge from-layer="3885" from-port="2" to-layer="3887" to-port="0" /> + <edge from-layer="3886" from-port="0" to-layer="3887" to-port="1" /> + <edge from-layer="3887" from-port="2" to-layer="3888" to-port="0" /> + <edge from-layer="3888" from-port="2" to-layer="3890" to-port="0" /> + <edge from-layer="3888" from-port="2" to-layer="3918" to-port="1" /> + <edge from-layer="3889" from-port="0" to-layer="3890" to-port="1" /> + <edge from-layer="3890" from-port="2" to-layer="3892" to-port="0" /> + <edge from-layer="3891" from-port="0" to-layer="3892" to-port="1" /> + <edge from-layer="3892" from-port="2" to-layer="3894" to-port="0" /> + <edge from-layer="3893" from-port="0" to-layer="3894" to-port="1" /> + <edge from-layer="3894" from-port="2" to-layer="3903" to-port="0" /> + <edge from-layer="3895" from-port="0" to-layer="3896" to-port="0" /> + <edge from-layer="3896" from-port="1" to-layer="3899" to-port="0" /> + <edge from-layer="3897" from-port="0" to-layer="3898" to-port="0" /> + <edge from-layer="3898" from-port="1" to-layer="3899" to-port="1" /> + <edge from-layer="3899" from-port="2" to-layer="3901" to-port="0" /> + <edge from-layer="3900" from-port="0" to-layer="3901" to-port="1" /> + <edge from-layer="3901" from-port="2" to-layer="3902" to-port="0" /> + <edge from-layer="3902" from-port="1" to-layer="3903" to-port="1" /> + <edge from-layer="3903" from-port="2" to-layer="3905" to-port="0" /> + <edge from-layer="3904" from-port="0" to-layer="3905" to-port="1" /> + <edge from-layer="3905" from-port="2" to-layer="3906" to-port="0" /> + <edge from-layer="3906" from-port="1" to-layer="3915" to-port="0" /> + <edge from-layer="3907" from-port="0" to-layer="3908" to-port="0" /> + <edge from-layer="3908" from-port="1" to-layer="3911" to-port="0" /> + <edge from-layer="3909" from-port="0" to-layer="3910" to-port="0" /> + <edge from-layer="3910" from-port="1" to-layer="3911" to-port="1" /> + <edge from-layer="3911" from-port="2" to-layer="3913" to-port="0" /> + <edge from-layer="3912" from-port="0" to-layer="3913" to-port="1" /> + <edge from-layer="3913" from-port="2" to-layer="3914" to-port="0" /> + <edge from-layer="3914" from-port="1" to-layer="3915" to-port="1" /> + <edge from-layer="3915" from-port="2" to-layer="3917" to-port="0" /> + <edge from-layer="3916" from-port="0" to-layer="3917" to-port="1" /> + <edge from-layer="3917" from-port="2" to-layer="3918" to-port="0" /> + <edge from-layer="3918" from-port="2" to-layer="4115" to-port="1" /> + <edge from-layer="3918" from-port="2" to-layer="3920" to-port="0" /> + <edge from-layer="3919" from-port="0" to-layer="3920" to-port="1" /> + <edge from-layer="3920" from-port="2" to-layer="3922" to-port="0" /> + <edge from-layer="3921" from-port="0" to-layer="3922" to-port="1" /> + <edge from-layer="3922" from-port="2" to-layer="3924" to-port="0" /> + <edge from-layer="3923" from-port="0" to-layer="3924" to-port="1" /> + <edge from-layer="3924" from-port="2" to-layer="3933" to-port="0" /> + <edge from-layer="3925" from-port="0" to-layer="3926" to-port="0" /> + <edge from-layer="3926" from-port="1" to-layer="3929" to-port="0" /> + <edge from-layer="3927" from-port="0" to-layer="3928" to-port="0" /> + <edge from-layer="3928" from-port="1" to-layer="3929" to-port="1" /> + <edge from-layer="3929" from-port="2" to-layer="3931" to-port="0" /> + <edge from-layer="3930" from-port="0" to-layer="3931" to-port="1" /> + <edge from-layer="3931" from-port="2" to-layer="3932" to-port="0" /> + <edge from-layer="3932" from-port="1" to-layer="3933" to-port="1" /> + <edge from-layer="3933" from-port="2" to-layer="3935" to-port="0" /> + <edge from-layer="3934" from-port="0" to-layer="3935" to-port="1" /> + <edge from-layer="3935" from-port="2" to-layer="3937" to-port="0" /> + <edge from-layer="3936" from-port="0" to-layer="3937" to-port="1" /> + <edge from-layer="3937" from-port="2" to-layer="4051" to-port="0" /> + <edge from-layer="3937" from-port="2" to-layer="3953" to-port="0" /> + <edge from-layer="3937" from-port="2" to-layer="3941" to-port="0" /> + <edge from-layer="3938" from-port="0" to-layer="3941" to-port="1" /> + <edge from-layer="3939" from-port="0" to-layer="3941" to-port="2" /> + <edge from-layer="3940" from-port="0" to-layer="3941" to-port="3" /> + <edge from-layer="3941" from-port="4" to-layer="3943" to-port="0" /> + <edge from-layer="3942" from-port="0" to-layer="3943" to-port="1" /> + <edge from-layer="3943" from-port="2" to-layer="3947" to-port="0" /> + <edge from-layer="3944" from-port="0" to-layer="3947" to-port="1" /> + <edge from-layer="3945" from-port="0" to-layer="3947" to-port="2" /> + <edge from-layer="3946" from-port="0" to-layer="3947" to-port="3" /> + <edge from-layer="3947" from-port="4" to-layer="3979" to-port="0" /> + <edge from-layer="3947" from-port="4" to-layer="3993" to-port="0" /> + <edge from-layer="3947" from-port="4" to-layer="3998" to-port="0" /> + <edge from-layer="3947" from-port="4" to-layer="3982" to-port="0" /> + <edge from-layer="3948" from-port="0" to-layer="3975" to-port="0" /> + <edge from-layer="3949" from-port="0" to-layer="3975" to-port="1" /> + <edge from-layer="3950" from-port="0" to-layer="3953" to-port="1" /> + <edge from-layer="3951" from-port="0" to-layer="3953" to-port="2" /> + <edge from-layer="3952" from-port="0" to-layer="3953" to-port="3" /> + <edge from-layer="3953" from-port="4" to-layer="4010" to-port="0" /> + <edge from-layer="3953" from-port="4" to-layer="3954" to-port="0" /> + <edge from-layer="3954" from-port="1" to-layer="3957" to-port="0" /> + <edge from-layer="3955" from-port="0" to-layer="3957" to-port="1" /> + <edge from-layer="3956" from-port="0" to-layer="3957" to-port="2" /> + <edge from-layer="3957" from-port="3" to-layer="3973" to-port="0" /> + <edge from-layer="3958" from-port="0" to-layer="3963" to-port="0" /> + <edge from-layer="3959" from-port="0" to-layer="3962" to-port="1" /> + <edge from-layer="3960" from-port="0" to-layer="3962" to-port="2" /> + <edge from-layer="3961" from-port="0" to-layer="3962" to-port="3" /> + <edge from-layer="3962" from-port="4" to-layer="3963" to-port="1" /> + <edge from-layer="3963" from-port="2" to-layer="3964" to-port="0" /> + <edge from-layer="3964" from-port="1" to-layer="3966" to-port="0" /> + <edge from-layer="3965" from-port="0" to-layer="3966" to-port="2" /> + <edge from-layer="3966" from-port="3" to-layer="3967" to-port="0" /> + <edge from-layer="3966" from-port="3" to-layer="4038" to-port="0" /> + <edge from-layer="3967" from-port="1" to-layer="3970" to-port="0" /> + <edge from-layer="3968" from-port="0" to-layer="3970" to-port="1" /> + <edge from-layer="3969" from-port="0" to-layer="3970" to-port="2" /> + <edge from-layer="3970" from-port="3" to-layer="3972" to-port="0" /> + <edge from-layer="3970" from-port="3" to-layer="4062" to-port="0" /> + <edge from-layer="3971" from-port="0" to-layer="3972" to-port="1" /> + <edge from-layer="3972" from-port="2" to-layer="3973" to-port="1" /> + <edge from-layer="3973" from-port="2" to-layer="4003" to-port="2" /> + <edge from-layer="3973" from-port="2" to-layer="3975" to-port="2" /> + <edge from-layer="3974" from-port="0" to-layer="3975" to-port="3" /> + <edge from-layer="3975" from-port="4" to-layer="3977" to-port="0" /> + <edge from-layer="3976" from-port="0" to-layer="3977" to-port="2" /> + <edge from-layer="3977" from-port="3" to-layer="3978" to-port="0" /> + <edge from-layer="3978" from-port="2" to-layer="4015" to-port="1" /> + <edge from-layer="3978" from-port="2" to-layer="3979" to-port="1" /> + <edge from-layer="3979" from-port="2" to-layer="4008" to-port="0" /> + <edge from-layer="3980" from-port="0" to-layer="3990" to-port="0" /> + <edge from-layer="3981" from-port="0" to-layer="3990" to-port="1" /> + <edge from-layer="3982" from-port="1" to-layer="3984" to-port="0" /> + <edge from-layer="3983" from-port="0" to-layer="3984" to-port="2" /> + <edge from-layer="3984" from-port="3" to-layer="3985" to-port="0" /> + <edge from-layer="3985" from-port="2" to-layer="3986" to-port="0" /> + <edge from-layer="3986" from-port="1" to-layer="3988" to-port="0" /> + <edge from-layer="3987" from-port="0" to-layer="3988" to-port="1" /> + <edge from-layer="3988" from-port="2" to-layer="3990" to-port="2" /> + <edge from-layer="3989" from-port="0" to-layer="3990" to-port="3" /> + <edge from-layer="3990" from-port="4" to-layer="3993" to-port="1" /> + <edge from-layer="3990" from-port="4" to-layer="3998" to-port="2" /> + <edge from-layer="3991" from-port="0" to-layer="3993" to-port="2" /> + <edge from-layer="3992" from-port="0" to-layer="3993" to-port="3" /> + <edge from-layer="3993" from-port="4" to-layer="3995" to-port="0" /> + <edge from-layer="3994" from-port="0" to-layer="3995" to-port="1" /> + <edge from-layer="3995" from-port="2" to-layer="3999" to-port="0" /> + <edge from-layer="3996" from-port="0" to-layer="3998" to-port="1" /> + <edge from-layer="3997" from-port="0" to-layer="3998" to-port="3" /> + <edge from-layer="3998" from-port="4" to-layer="3999" to-port="1" /> + <edge from-layer="3999" from-port="2" to-layer="4007" to-port="0" /> + <edge from-layer="4000" from-port="0" to-layer="4003" to-port="0" /> + <edge from-layer="4001" from-port="0" to-layer="4003" to-port="1" /> + <edge from-layer="4002" from-port="0" to-layer="4003" to-port="3" /> + <edge from-layer="4003" from-port="4" to-layer="4005" to-port="0" /> + <edge from-layer="4004" from-port="0" to-layer="4005" to-port="2" /> + <edge from-layer="4005" from-port="3" to-layer="4006" to-port="0" /> + <edge from-layer="4006" from-port="2" to-layer="4007" to-port="1" /> + <edge from-layer="4006" from-port="2" to-layer="4036" to-port="1" /> + <edge from-layer="4007" from-port="2" to-layer="4008" to-port="1" /> + <edge from-layer="4008" from-port="2" to-layer="4099" to-port="0" /> + <edge from-layer="4008" from-port="2" to-layer="4063" to-port="0" /> + <edge from-layer="4009" from-port="0" to-layer="4010" to-port="1" /> + <edge from-layer="4010" from-port="2" to-layer="4014" to-port="0" /> + <edge from-layer="4011" from-port="0" to-layer="4014" to-port="1" /> + <edge from-layer="4012" from-port="0" to-layer="4014" to-port="2" /> + <edge from-layer="4013" from-port="0" to-layer="4014" to-port="3" /> + <edge from-layer="4014" from-port="4" to-layer="4034" to-port="0" /> + <edge from-layer="4014" from-port="4" to-layer="4015" to-port="0" /> + <edge from-layer="4014" from-port="4" to-layer="4029" to-port="0" /> + <edge from-layer="4014" from-port="4" to-layer="4018" to-port="0" /> + <edge from-layer="4015" from-port="2" to-layer="4037" to-port="0" /> + <edge from-layer="4016" from-port="0" to-layer="4026" to-port="0" /> + <edge from-layer="4017" from-port="0" to-layer="4026" to-port="1" /> + <edge from-layer="4018" from-port="1" to-layer="4020" to-port="0" /> + <edge from-layer="4019" from-port="0" to-layer="4020" to-port="2" /> + <edge from-layer="4020" from-port="3" to-layer="4021" to-port="0" /> + <edge from-layer="4021" from-port="2" to-layer="4022" to-port="0" /> + <edge from-layer="4022" from-port="1" to-layer="4024" to-port="0" /> + <edge from-layer="4023" from-port="0" to-layer="4024" to-port="1" /> + <edge from-layer="4024" from-port="2" to-layer="4026" to-port="2" /> + <edge from-layer="4025" from-port="0" to-layer="4026" to-port="3" /> + <edge from-layer="4026" from-port="4" to-layer="4034" to-port="2" /> + <edge from-layer="4026" from-port="4" to-layer="4029" to-port="1" /> + <edge from-layer="4027" from-port="0" to-layer="4029" to-port="2" /> + <edge from-layer="4028" from-port="0" to-layer="4029" to-port="3" /> + <edge from-layer="4029" from-port="4" to-layer="4031" to-port="0" /> + <edge from-layer="4030" from-port="0" to-layer="4031" to-port="1" /> + <edge from-layer="4031" from-port="2" to-layer="4035" to-port="0" /> + <edge from-layer="4032" from-port="0" to-layer="4034" to-port="1" /> + <edge from-layer="4033" from-port="0" to-layer="4034" to-port="3" /> + <edge from-layer="4034" from-port="4" to-layer="4035" to-port="1" /> + <edge from-layer="4035" from-port="2" to-layer="4036" to-port="0" /> + <edge from-layer="4036" from-port="2" to-layer="4037" to-port="1" /> + <edge from-layer="4037" from-port="2" to-layer="4058" to-port="0" /> + <edge from-layer="4037" from-port="2" to-layer="4038" to-port="1" /> + <edge from-layer="4038" from-port="2" to-layer="7222" to-port="0" /> + <edge from-layer="4038" from-port="2" to-layer="4099" to-port="1" /> + <edge from-layer="4039" from-port="0" to-layer="4044" to-port="0" /> + <edge from-layer="4040" from-port="0" to-layer="4043" to-port="1" /> + <edge from-layer="4041" from-port="0" to-layer="4043" to-port="2" /> + <edge from-layer="4042" from-port="0" to-layer="4043" to-port="3" /> + <edge from-layer="4043" from-port="4" to-layer="4044" to-port="1" /> + <edge from-layer="4044" from-port="2" to-layer="4045" to-port="0" /> + <edge from-layer="4045" from-port="1" to-layer="4047" to-port="0" /> + <edge from-layer="4046" from-port="0" to-layer="4047" to-port="2" /> + <edge from-layer="4047" from-port="3" to-layer="4054" to-port="0" /> + <edge from-layer="4048" from-port="0" to-layer="4051" to-port="1" /> + <edge from-layer="4049" from-port="0" to-layer="4051" to-port="2" /> + <edge from-layer="4050" from-port="0" to-layer="4051" to-port="3" /> + <edge from-layer="4051" from-port="4" to-layer="4053" to-port="0" /> + <edge from-layer="4052" from-port="0" to-layer="4053" to-port="1" /> + <edge from-layer="4053" from-port="2" to-layer="4054" to-port="1" /> + <edge from-layer="4054" from-port="2" to-layer="4099" to-port="2" /> + <edge from-layer="4054" from-port="2" to-layer="7221" to-port="0" /> + <edge from-layer="4055" from-port="0" to-layer="4077" to-port="0" /> + <edge from-layer="4056" from-port="0" to-layer="4071" to-port="0" /> + <edge from-layer="4057" from-port="0" to-layer="4075" to-port="1" /> + <edge from-layer="4057" from-port="0" to-layer="4071" to-port="1" /> + <edge from-layer="4058" from-port="1" to-layer="4061" to-port="0" /> + <edge from-layer="4059" from-port="0" to-layer="4061" to-port="1" /> + <edge from-layer="4060" from-port="0" to-layer="4061" to-port="2" /> + <edge from-layer="4061" from-port="3" to-layer="4062" to-port="1" /> + <edge from-layer="4062" from-port="2" to-layer="4067" to-port="0" /> + <edge from-layer="4062" from-port="2" to-layer="4074" to-port="0" /> + <edge from-layer="4063" from-port="1" to-layer="4092" to-port="0" /> + <edge from-layer="4063" from-port="1" to-layer="4066" to-port="0" /> + <edge from-layer="4064" from-port="0" to-layer="4066" to-port="1" /> + <edge from-layer="4065" from-port="0" to-layer="4066" to-port="2" /> + <edge from-layer="4066" from-port="3" to-layer="4067" to-port="1" /> + <edge from-layer="4067" from-port="2" to-layer="4069" to-port="0" /> + <edge from-layer="4068" from-port="0" to-layer="4069" to-port="1" /> + <edge from-layer="4069" from-port="2" to-layer="4071" to-port="2" /> + <edge from-layer="4070" from-port="0" to-layer="4075" to-port="3" /> + <edge from-layer="4070" from-port="0" to-layer="4071" to-port="3" /> + <edge from-layer="4071" from-port="4" to-layer="4077" to-port="1" /> + <edge from-layer="4072" from-port="0" to-layer="4075" to-port="0" /> + <edge from-layer="4073" from-port="0" to-layer="4074" to-port="1" /> + <edge from-layer="4074" from-port="2" to-layer="4082" to-port="2" /> + <edge from-layer="4074" from-port="2" to-layer="4075" to-port="2" /> + <edge from-layer="4075" from-port="4" to-layer="4077" to-port="2" /> + <edge from-layer="4076" from-port="0" to-layer="4077" to-port="3" /> + <edge from-layer="4077" from-port="4" to-layer="4084" to-port="0" /> + <edge from-layer="4078" from-port="0" to-layer="4084" to-port="1" /> + <edge from-layer="4079" from-port="0" to-layer="4082" to-port="0" /> + <edge from-layer="4080" from-port="0" to-layer="4082" to-port="1" /> + <edge from-layer="4081" from-port="0" to-layer="4082" to-port="3" /> + <edge from-layer="4082" from-port="4" to-layer="4084" to-port="2" /> + <edge from-layer="4083" from-port="0" to-layer="4084" to-port="3" /> + <edge from-layer="4084" from-port="4" to-layer="4087" to-port="0" /> + <edge from-layer="4085" from-port="0" to-layer="4087" to-port="1" /> + <edge from-layer="4086" from-port="0" to-layer="4087" to-port="2" /> + <edge from-layer="4087" from-port="3" to-layer="4088" to-port="0" /> + <edge from-layer="4088" from-port="2" to-layer="4089" to-port="0" /> + <edge from-layer="4088" from-port="2" to-layer="4098" to-port="0" /> + <edge from-layer="4089" from-port="1" to-layer="4097" to-port="0" /> + <edge from-layer="4090" from-port="0" to-layer="4092" to-port="1" /> + <edge from-layer="4091" from-port="0" to-layer="4092" to-port="2" /> + <edge from-layer="4092" from-port="3" to-layer="4096" to-port="0" /> + <edge from-layer="4093" from-port="0" to-layer="4096" to-port="1" /> + <edge from-layer="4094" from-port="0" to-layer="4096" to-port="2" /> + <edge from-layer="4095" from-port="0" to-layer="4096" to-port="3" /> + <edge from-layer="4096" from-port="4" to-layer="4097" to-port="1" /> + <edge from-layer="4097" from-port="2" to-layer="4098" to-port="1" /> + <edge from-layer="4098" from-port="2" to-layer="4099" to-port="3" /> + <edge from-layer="4099" from-port="4" to-layer="4101" to-port="0" /> + <edge from-layer="4100" from-port="0" to-layer="4101" to-port="1" /> + <edge from-layer="4101" from-port="2" to-layer="4103" to-port="0" /> + <edge from-layer="4102" from-port="0" to-layer="4103" to-port="1" /> + <edge from-layer="4103" from-port="2" to-layer="4112" to-port="0" /> + <edge from-layer="4104" from-port="0" to-layer="4105" to-port="0" /> + <edge from-layer="4105" from-port="1" to-layer="4108" to-port="0" /> + <edge from-layer="4106" from-port="0" to-layer="4107" to-port="0" /> + <edge from-layer="4107" from-port="1" to-layer="4108" to-port="1" /> + <edge from-layer="4108" from-port="2" to-layer="4110" to-port="0" /> + <edge from-layer="4109" from-port="0" to-layer="4110" to-port="1" /> + <edge from-layer="4110" from-port="2" to-layer="4111" to-port="0" /> + <edge from-layer="4111" from-port="1" to-layer="4112" to-port="1" /> + <edge from-layer="4112" from-port="2" to-layer="4114" to-port="0" /> + <edge from-layer="4113" from-port="0" to-layer="4114" to-port="1" /> + <edge from-layer="4114" from-port="2" to-layer="4115" to-port="0" /> + <edge from-layer="4115" from-port="2" to-layer="4145" to-port="1" /> + <edge from-layer="4115" from-port="2" to-layer="4117" to-port="0" /> + <edge from-layer="4116" from-port="0" to-layer="4117" to-port="1" /> + <edge from-layer="4117" from-port="2" to-layer="4119" to-port="0" /> + <edge from-layer="4118" from-port="0" to-layer="4119" to-port="1" /> + <edge from-layer="4119" from-port="2" to-layer="4121" to-port="0" /> + <edge from-layer="4120" from-port="0" to-layer="4121" to-port="1" /> + <edge from-layer="4121" from-port="2" to-layer="4130" to-port="0" /> + <edge from-layer="4122" from-port="0" to-layer="4123" to-port="0" /> + <edge from-layer="4123" from-port="1" to-layer="4126" to-port="0" /> + <edge from-layer="4124" from-port="0" to-layer="4125" to-port="0" /> + <edge from-layer="4125" from-port="1" to-layer="4126" to-port="1" /> + <edge from-layer="4126" from-port="2" to-layer="4128" to-port="0" /> + <edge from-layer="4127" from-port="0" to-layer="4128" to-port="1" /> + <edge from-layer="4128" from-port="2" to-layer="4129" to-port="0" /> + <edge from-layer="4129" from-port="1" to-layer="4130" to-port="1" /> + <edge from-layer="4130" from-port="2" to-layer="4132" to-port="0" /> + <edge from-layer="4131" from-port="0" to-layer="4132" to-port="1" /> + <edge from-layer="4132" from-port="2" to-layer="4133" to-port="0" /> + <edge from-layer="4133" from-port="1" to-layer="4142" to-port="0" /> + <edge from-layer="4134" from-port="0" to-layer="4135" to-port="0" /> + <edge from-layer="4135" from-port="1" to-layer="4138" to-port="0" /> + <edge from-layer="4136" from-port="0" to-layer="4137" to-port="0" /> + <edge from-layer="4137" from-port="1" to-layer="4138" to-port="1" /> + <edge from-layer="4138" from-port="2" to-layer="4140" to-port="0" /> + <edge from-layer="4139" from-port="0" to-layer="4140" to-port="1" /> + <edge from-layer="4140" from-port="2" to-layer="4141" to-port="0" /> + <edge from-layer="4141" from-port="1" to-layer="4142" to-port="1" /> + <edge from-layer="4142" from-port="2" to-layer="4144" to-port="0" /> + <edge from-layer="4143" from-port="0" to-layer="4144" to-port="1" /> + <edge from-layer="4144" from-port="2" to-layer="4145" to-port="0" /> + <edge from-layer="4145" from-port="2" to-layer="4147" to-port="0" /> + <edge from-layer="4145" from-port="2" to-layer="4342" to-port="1" /> + <edge from-layer="4146" from-port="0" to-layer="4147" to-port="1" /> + <edge from-layer="4147" from-port="2" to-layer="4149" to-port="0" /> + <edge from-layer="4148" from-port="0" to-layer="4149" to-port="1" /> + <edge from-layer="4149" from-port="2" to-layer="4151" to-port="0" /> + <edge from-layer="4150" from-port="0" to-layer="4151" to-port="1" /> + <edge from-layer="4151" from-port="2" to-layer="4160" to-port="0" /> + <edge from-layer="4152" from-port="0" to-layer="4153" to-port="0" /> + <edge from-layer="4153" from-port="1" to-layer="4156" to-port="0" /> + <edge from-layer="4154" from-port="0" to-layer="4155" to-port="0" /> + <edge from-layer="4155" from-port="1" to-layer="4156" to-port="1" /> + <edge from-layer="4156" from-port="2" to-layer="4158" to-port="0" /> + <edge from-layer="4157" from-port="0" to-layer="4158" to-port="1" /> + <edge from-layer="4158" from-port="2" to-layer="4159" to-port="0" /> + <edge from-layer="4159" from-port="1" to-layer="4160" to-port="1" /> + <edge from-layer="4160" from-port="2" to-layer="4162" to-port="0" /> + <edge from-layer="4161" from-port="0" to-layer="4162" to-port="1" /> + <edge from-layer="4162" from-port="2" to-layer="4164" to-port="0" /> + <edge from-layer="4163" from-port="0" to-layer="4164" to-port="1" /> + <edge from-layer="4164" from-port="2" to-layer="4168" to-port="0" /> + <edge from-layer="4164" from-port="2" to-layer="4278" to-port="0" /> + <edge from-layer="4164" from-port="2" to-layer="4180" to-port="0" /> + <edge from-layer="4165" from-port="0" to-layer="4168" to-port="1" /> + <edge from-layer="4166" from-port="0" to-layer="4168" to-port="2" /> + <edge from-layer="4167" from-port="0" to-layer="4168" to-port="3" /> + <edge from-layer="4168" from-port="4" to-layer="4170" to-port="0" /> + <edge from-layer="4169" from-port="0" to-layer="4170" to-port="1" /> + <edge from-layer="4170" from-port="2" to-layer="4174" to-port="0" /> + <edge from-layer="4171" from-port="0" to-layer="4174" to-port="1" /> + <edge from-layer="4172" from-port="0" to-layer="4174" to-port="2" /> + <edge from-layer="4173" from-port="0" to-layer="4174" to-port="3" /> + <edge from-layer="4174" from-port="4" to-layer="4220" to-port="0" /> + <edge from-layer="4174" from-port="4" to-layer="4225" to-port="0" /> + <edge from-layer="4174" from-port="4" to-layer="4209" to-port="0" /> + <edge from-layer="4174" from-port="4" to-layer="4206" to-port="0" /> + <edge from-layer="4175" from-port="0" to-layer="4202" to-port="0" /> + <edge from-layer="4176" from-port="0" to-layer="4202" to-port="1" /> + <edge from-layer="4177" from-port="0" to-layer="4180" to-port="1" /> + <edge from-layer="4178" from-port="0" to-layer="4180" to-port="2" /> + <edge from-layer="4179" from-port="0" to-layer="4180" to-port="3" /> + <edge from-layer="4180" from-port="4" to-layer="4181" to-port="0" /> + <edge from-layer="4180" from-port="4" to-layer="4237" to-port="0" /> + <edge from-layer="4181" from-port="1" to-layer="4184" to-port="0" /> + <edge from-layer="4182" from-port="0" to-layer="4184" to-port="1" /> + <edge from-layer="4183" from-port="0" to-layer="4184" to-port="2" /> + <edge from-layer="4184" from-port="3" to-layer="4200" to-port="0" /> + <edge from-layer="4185" from-port="0" to-layer="4190" to-port="0" /> + <edge from-layer="4186" from-port="0" to-layer="4189" to-port="1" /> + <edge from-layer="4187" from-port="0" to-layer="4189" to-port="2" /> + <edge from-layer="4188" from-port="0" to-layer="4189" to-port="3" /> + <edge from-layer="4189" from-port="4" to-layer="4190" to-port="1" /> + <edge from-layer="4190" from-port="2" to-layer="4191" to-port="0" /> + <edge from-layer="4191" from-port="1" to-layer="4193" to-port="0" /> + <edge from-layer="4192" from-port="0" to-layer="4193" to-port="2" /> + <edge from-layer="4193" from-port="3" to-layer="4265" to-port="0" /> + <edge from-layer="4193" from-port="3" to-layer="4194" to-port="0" /> + <edge from-layer="4194" from-port="1" to-layer="4197" to-port="0" /> + <edge from-layer="4195" from-port="0" to-layer="4197" to-port="1" /> + <edge from-layer="4196" from-port="0" to-layer="4197" to-port="2" /> + <edge from-layer="4197" from-port="3" to-layer="4199" to-port="0" /> + <edge from-layer="4197" from-port="3" to-layer="4289" to-port="0" /> + <edge from-layer="4198" from-port="0" to-layer="4199" to-port="1" /> + <edge from-layer="4199" from-port="2" to-layer="4200" to-port="1" /> + <edge from-layer="4200" from-port="2" to-layer="4230" to-port="2" /> + <edge from-layer="4200" from-port="2" to-layer="4202" to-port="2" /> + <edge from-layer="4201" from-port="0" to-layer="4202" to-port="3" /> + <edge from-layer="4202" from-port="4" to-layer="4204" to-port="0" /> + <edge from-layer="4203" from-port="0" to-layer="4204" to-port="2" /> + <edge from-layer="4204" from-port="3" to-layer="4205" to-port="0" /> + <edge from-layer="4205" from-port="2" to-layer="4206" to-port="1" /> + <edge from-layer="4205" from-port="2" to-layer="4242" to-port="1" /> + <edge from-layer="4206" from-port="2" to-layer="4235" to-port="0" /> + <edge from-layer="4207" from-port="0" to-layer="4217" to-port="0" /> + <edge from-layer="4208" from-port="0" to-layer="4217" to-port="1" /> + <edge from-layer="4209" from-port="1" to-layer="4211" to-port="0" /> + <edge from-layer="4210" from-port="0" to-layer="4211" to-port="2" /> + <edge from-layer="4211" from-port="3" to-layer="4212" to-port="0" /> + <edge from-layer="4212" from-port="2" to-layer="4213" to-port="0" /> + <edge from-layer="4213" from-port="1" to-layer="4215" to-port="0" /> + <edge from-layer="4214" from-port="0" to-layer="4215" to-port="1" /> + <edge from-layer="4215" from-port="2" to-layer="4217" to-port="2" /> + <edge from-layer="4216" from-port="0" to-layer="4217" to-port="3" /> + <edge from-layer="4217" from-port="4" to-layer="4225" to-port="2" /> + <edge from-layer="4217" from-port="4" to-layer="4220" to-port="1" /> + <edge from-layer="4218" from-port="0" to-layer="4220" to-port="2" /> + <edge from-layer="4219" from-port="0" to-layer="4220" to-port="3" /> + <edge from-layer="4220" from-port="4" to-layer="4222" to-port="0" /> + <edge from-layer="4221" from-port="0" to-layer="4222" to-port="1" /> + <edge from-layer="4222" from-port="2" to-layer="4226" to-port="0" /> + <edge from-layer="4223" from-port="0" to-layer="4225" to-port="1" /> + <edge from-layer="4224" from-port="0" to-layer="4225" to-port="3" /> + <edge from-layer="4225" from-port="4" to-layer="4226" to-port="1" /> + <edge from-layer="4226" from-port="2" to-layer="4234" to-port="0" /> + <edge from-layer="4227" from-port="0" to-layer="4230" to-port="0" /> + <edge from-layer="4228" from-port="0" to-layer="4230" to-port="1" /> + <edge from-layer="4229" from-port="0" to-layer="4230" to-port="3" /> + <edge from-layer="4230" from-port="4" to-layer="4232" to-port="0" /> + <edge from-layer="4231" from-port="0" to-layer="4232" to-port="2" /> + <edge from-layer="4232" from-port="3" to-layer="4233" to-port="0" /> + <edge from-layer="4233" from-port="2" to-layer="4234" to-port="1" /> + <edge from-layer="4233" from-port="2" to-layer="4263" to-port="1" /> + <edge from-layer="4234" from-port="2" to-layer="4235" to-port="1" /> + <edge from-layer="4235" from-port="2" to-layer="4290" to-port="0" /> + <edge from-layer="4235" from-port="2" to-layer="4326" to-port="0" /> + <edge from-layer="4236" from-port="0" to-layer="4237" to-port="1" /> + <edge from-layer="4237" from-port="2" to-layer="4241" to-port="0" /> + <edge from-layer="4238" from-port="0" to-layer="4241" to-port="1" /> + <edge from-layer="4239" from-port="0" to-layer="4241" to-port="2" /> + <edge from-layer="4240" from-port="0" to-layer="4241" to-port="3" /> + <edge from-layer="4241" from-port="4" to-layer="4242" to-port="0" /> + <edge from-layer="4241" from-port="4" to-layer="4256" to-port="0" /> + <edge from-layer="4241" from-port="4" to-layer="4261" to-port="0" /> + <edge from-layer="4241" from-port="4" to-layer="4245" to-port="0" /> + <edge from-layer="4242" from-port="2" to-layer="4264" to-port="0" /> + <edge from-layer="4243" from-port="0" to-layer="4253" to-port="0" /> + <edge from-layer="4244" from-port="0" to-layer="4253" to-port="1" /> + <edge from-layer="4245" from-port="1" to-layer="4247" to-port="0" /> + <edge from-layer="4246" from-port="0" to-layer="4247" to-port="2" /> + <edge from-layer="4247" from-port="3" to-layer="4248" to-port="0" /> + <edge from-layer="4248" from-port="2" to-layer="4249" to-port="0" /> + <edge from-layer="4249" from-port="1" to-layer="4251" to-port="0" /> + <edge from-layer="4250" from-port="0" to-layer="4251" to-port="1" /> + <edge from-layer="4251" from-port="2" to-layer="4253" to-port="2" /> + <edge from-layer="4252" from-port="0" to-layer="4253" to-port="3" /> + <edge from-layer="4253" from-port="4" to-layer="4256" to-port="1" /> + <edge from-layer="4253" from-port="4" to-layer="4261" to-port="2" /> + <edge from-layer="4254" from-port="0" to-layer="4256" to-port="2" /> + <edge from-layer="4255" from-port="0" to-layer="4256" to-port="3" /> + <edge from-layer="4256" from-port="4" to-layer="4258" to-port="0" /> + <edge from-layer="4257" from-port="0" to-layer="4258" to-port="1" /> + <edge from-layer="4258" from-port="2" to-layer="4262" to-port="0" /> + <edge from-layer="4259" from-port="0" to-layer="4261" to-port="1" /> + <edge from-layer="4260" from-port="0" to-layer="4261" to-port="3" /> + <edge from-layer="4261" from-port="4" to-layer="4262" to-port="1" /> + <edge from-layer="4262" from-port="2" to-layer="4263" to-port="0" /> + <edge from-layer="4263" from-port="2" to-layer="4264" to-port="1" /> + <edge from-layer="4264" from-port="2" to-layer="4265" to-port="1" /> + <edge from-layer="4264" from-port="2" to-layer="4285" to-port="0" /> + <edge from-layer="4265" from-port="2" to-layer="4326" to-port="1" /> + <edge from-layer="4265" from-port="2" to-layer="7220" to-port="0" /> + <edge from-layer="4266" from-port="0" to-layer="4271" to-port="0" /> + <edge from-layer="4267" from-port="0" to-layer="4270" to-port="1" /> + <edge from-layer="4268" from-port="0" to-layer="4270" to-port="2" /> + <edge from-layer="4269" from-port="0" to-layer="4270" to-port="3" /> + <edge from-layer="4270" from-port="4" to-layer="4271" to-port="1" /> + <edge from-layer="4271" from-port="2" to-layer="4272" to-port="0" /> + <edge from-layer="4272" from-port="1" to-layer="4274" to-port="0" /> + <edge from-layer="4273" from-port="0" to-layer="4274" to-port="2" /> + <edge from-layer="4274" from-port="3" to-layer="4281" to-port="0" /> + <edge from-layer="4275" from-port="0" to-layer="4278" to-port="1" /> + <edge from-layer="4276" from-port="0" to-layer="4278" to-port="2" /> + <edge from-layer="4277" from-port="0" to-layer="4278" to-port="3" /> + <edge from-layer="4278" from-port="4" to-layer="4280" to-port="0" /> + <edge from-layer="4279" from-port="0" to-layer="4280" to-port="1" /> + <edge from-layer="4280" from-port="2" to-layer="4281" to-port="1" /> + <edge from-layer="4281" from-port="2" to-layer="7219" to-port="0" /> + <edge from-layer="4281" from-port="2" to-layer="4326" to-port="2" /> + <edge from-layer="4282" from-port="0" to-layer="4304" to-port="0" /> + <edge from-layer="4283" from-port="0" to-layer="4298" to-port="0" /> + <edge from-layer="4284" from-port="0" to-layer="4302" to-port="1" /> + <edge from-layer="4284" from-port="0" to-layer="4298" to-port="1" /> + <edge from-layer="4285" from-port="1" to-layer="4288" to-port="0" /> + <edge from-layer="4286" from-port="0" to-layer="4288" to-port="1" /> + <edge from-layer="4287" from-port="0" to-layer="4288" to-port="2" /> + <edge from-layer="4288" from-port="3" to-layer="4289" to-port="1" /> + <edge from-layer="4289" from-port="2" to-layer="4294" to-port="0" /> + <edge from-layer="4289" from-port="2" to-layer="4301" to-port="0" /> + <edge from-layer="4290" from-port="1" to-layer="4293" to-port="0" /> + <edge from-layer="4290" from-port="1" to-layer="4319" to-port="0" /> + <edge from-layer="4291" from-port="0" to-layer="4293" to-port="1" /> + <edge from-layer="4292" from-port="0" to-layer="4293" to-port="2" /> + <edge from-layer="4293" from-port="3" to-layer="4294" to-port="1" /> + <edge from-layer="4294" from-port="2" to-layer="4296" to-port="0" /> + <edge from-layer="4295" from-port="0" to-layer="4296" to-port="1" /> + <edge from-layer="4296" from-port="2" to-layer="4298" to-port="2" /> + <edge from-layer="4297" from-port="0" to-layer="4298" to-port="3" /> + <edge from-layer="4297" from-port="0" to-layer="4302" to-port="3" /> + <edge from-layer="4298" from-port="4" to-layer="4304" to-port="1" /> + <edge from-layer="4299" from-port="0" to-layer="4302" to-port="0" /> + <edge from-layer="4300" from-port="0" to-layer="4301" to-port="1" /> + <edge from-layer="4301" from-port="2" to-layer="4309" to-port="2" /> + <edge from-layer="4301" from-port="2" to-layer="4302" to-port="2" /> + <edge from-layer="4302" from-port="4" to-layer="4304" to-port="2" /> + <edge from-layer="4303" from-port="0" to-layer="4304" to-port="3" /> + <edge from-layer="4304" from-port="4" to-layer="4311" to-port="0" /> + <edge from-layer="4305" from-port="0" to-layer="4311" to-port="1" /> + <edge from-layer="4306" from-port="0" to-layer="4309" to-port="0" /> + <edge from-layer="4307" from-port="0" to-layer="4309" to-port="1" /> + <edge from-layer="4308" from-port="0" to-layer="4309" to-port="3" /> + <edge from-layer="4309" from-port="4" to-layer="4311" to-port="2" /> + <edge from-layer="4310" from-port="0" to-layer="4311" to-port="3" /> + <edge from-layer="4311" from-port="4" to-layer="4314" to-port="0" /> + <edge from-layer="4312" from-port="0" to-layer="4314" to-port="1" /> + <edge from-layer="4313" from-port="0" to-layer="4314" to-port="2" /> + <edge from-layer="4314" from-port="3" to-layer="4315" to-port="0" /> + <edge from-layer="4315" from-port="2" to-layer="4316" to-port="0" /> + <edge from-layer="4315" from-port="2" to-layer="4325" to-port="0" /> + <edge from-layer="4316" from-port="1" to-layer="4324" to-port="0" /> + <edge from-layer="4317" from-port="0" to-layer="4319" to-port="1" /> + <edge from-layer="4318" from-port="0" to-layer="4319" to-port="2" /> + <edge from-layer="4319" from-port="3" to-layer="4323" to-port="0" /> + <edge from-layer="4320" from-port="0" to-layer="4323" to-port="1" /> + <edge from-layer="4321" from-port="0" to-layer="4323" to-port="2" /> + <edge from-layer="4322" from-port="0" to-layer="4323" to-port="3" /> + <edge from-layer="4323" from-port="4" to-layer="4324" to-port="1" /> + <edge from-layer="4324" from-port="2" to-layer="4325" to-port="1" /> + <edge from-layer="4325" from-port="2" to-layer="4326" to-port="3" /> + <edge from-layer="4326" from-port="4" to-layer="4328" to-port="0" /> + <edge from-layer="4327" from-port="0" to-layer="4328" to-port="1" /> + <edge from-layer="4328" from-port="2" to-layer="4330" to-port="0" /> + <edge from-layer="4329" from-port="0" to-layer="4330" to-port="1" /> + <edge from-layer="4330" from-port="2" to-layer="4339" to-port="0" /> + <edge from-layer="4331" from-port="0" to-layer="4332" to-port="0" /> + <edge from-layer="4332" from-port="1" to-layer="4335" to-port="0" /> + <edge from-layer="4333" from-port="0" to-layer="4334" to-port="0" /> + <edge from-layer="4334" from-port="1" to-layer="4335" to-port="1" /> + <edge from-layer="4335" from-port="2" to-layer="4337" to-port="0" /> + <edge from-layer="4336" from-port="0" to-layer="4337" to-port="1" /> + <edge from-layer="4337" from-port="2" to-layer="4338" to-port="0" /> + <edge from-layer="4338" from-port="1" to-layer="4339" to-port="1" /> + <edge from-layer="4339" from-port="2" to-layer="4341" to-port="0" /> + <edge from-layer="4340" from-port="0" to-layer="4341" to-port="1" /> + <edge from-layer="4341" from-port="2" to-layer="4342" to-port="0" /> + <edge from-layer="4342" from-port="2" to-layer="4372" to-port="1" /> + <edge from-layer="4342" from-port="2" to-layer="4344" to-port="0" /> + <edge from-layer="4343" from-port="0" to-layer="4344" to-port="1" /> + <edge from-layer="4344" from-port="2" to-layer="4346" to-port="0" /> + <edge from-layer="4345" from-port="0" to-layer="4346" to-port="1" /> + <edge from-layer="4346" from-port="2" to-layer="4348" to-port="0" /> + <edge from-layer="4347" from-port="0" to-layer="4348" to-port="1" /> + <edge from-layer="4348" from-port="2" to-layer="4357" to-port="0" /> + <edge from-layer="4349" from-port="0" to-layer="4350" to-port="0" /> + <edge from-layer="4350" from-port="1" to-layer="4353" to-port="0" /> + <edge from-layer="4351" from-port="0" to-layer="4352" to-port="0" /> + <edge from-layer="4352" from-port="1" to-layer="4353" to-port="1" /> + <edge from-layer="4353" from-port="2" to-layer="4355" to-port="0" /> + <edge from-layer="4354" from-port="0" to-layer="4355" to-port="1" /> + <edge from-layer="4355" from-port="2" to-layer="4356" to-port="0" /> + <edge from-layer="4356" from-port="1" to-layer="4357" to-port="1" /> + <edge from-layer="4357" from-port="2" to-layer="4359" to-port="0" /> + <edge from-layer="4358" from-port="0" to-layer="4359" to-port="1" /> + <edge from-layer="4359" from-port="2" to-layer="4360" to-port="0" /> + <edge from-layer="4360" from-port="1" to-layer="4369" to-port="0" /> + <edge from-layer="4361" from-port="0" to-layer="4362" to-port="0" /> + <edge from-layer="4362" from-port="1" to-layer="4365" to-port="0" /> + <edge from-layer="4363" from-port="0" to-layer="4364" to-port="0" /> + <edge from-layer="4364" from-port="1" to-layer="4365" to-port="1" /> + <edge from-layer="4365" from-port="2" to-layer="4367" to-port="0" /> + <edge from-layer="4366" from-port="0" to-layer="4367" to-port="1" /> + <edge from-layer="4367" from-port="2" to-layer="4368" to-port="0" /> + <edge from-layer="4368" from-port="1" to-layer="4369" to-port="1" /> + <edge from-layer="4369" from-port="2" to-layer="4371" to-port="0" /> + <edge from-layer="4370" from-port="0" to-layer="4371" to-port="1" /> + <edge from-layer="4371" from-port="2" to-layer="4372" to-port="0" /> + <edge from-layer="4372" from-port="2" to-layer="4374" to-port="0" /> + <edge from-layer="4372" from-port="2" to-layer="4569" to-port="1" /> + <edge from-layer="4373" from-port="0" to-layer="4374" to-port="1" /> + <edge from-layer="4374" from-port="2" to-layer="4376" to-port="0" /> + <edge from-layer="4375" from-port="0" to-layer="4376" to-port="1" /> + <edge from-layer="4376" from-port="2" to-layer="4378" to-port="0" /> + <edge from-layer="4377" from-port="0" to-layer="4378" to-port="1" /> + <edge from-layer="4378" from-port="2" to-layer="4387" to-port="0" /> + <edge from-layer="4379" from-port="0" to-layer="4380" to-port="0" /> + <edge from-layer="4380" from-port="1" to-layer="4383" to-port="0" /> + <edge from-layer="4381" from-port="0" to-layer="4382" to-port="0" /> + <edge from-layer="4382" from-port="1" to-layer="4383" to-port="1" /> + <edge from-layer="4383" from-port="2" to-layer="4385" to-port="0" /> + <edge from-layer="4384" from-port="0" to-layer="4385" to-port="1" /> + <edge from-layer="4385" from-port="2" to-layer="4386" to-port="0" /> + <edge from-layer="4386" from-port="1" to-layer="4387" to-port="1" /> + <edge from-layer="4387" from-port="2" to-layer="4389" to-port="0" /> + <edge from-layer="4388" from-port="0" to-layer="4389" to-port="1" /> + <edge from-layer="4389" from-port="2" to-layer="4391" to-port="0" /> + <edge from-layer="4390" from-port="0" to-layer="4391" to-port="1" /> + <edge from-layer="4391" from-port="2" to-layer="4407" to-port="0" /> + <edge from-layer="4391" from-port="2" to-layer="4395" to-port="0" /> + <edge from-layer="4391" from-port="2" to-layer="4505" to-port="0" /> + <edge from-layer="4392" from-port="0" to-layer="4395" to-port="1" /> + <edge from-layer="4393" from-port="0" to-layer="4395" to-port="2" /> + <edge from-layer="4394" from-port="0" to-layer="4395" to-port="3" /> + <edge from-layer="4395" from-port="4" to-layer="4397" to-port="0" /> + <edge from-layer="4396" from-port="0" to-layer="4397" to-port="1" /> + <edge from-layer="4397" from-port="2" to-layer="4401" to-port="0" /> + <edge from-layer="4398" from-port="0" to-layer="4401" to-port="1" /> + <edge from-layer="4399" from-port="0" to-layer="4401" to-port="2" /> + <edge from-layer="4400" from-port="0" to-layer="4401" to-port="3" /> + <edge from-layer="4401" from-port="4" to-layer="4447" to-port="0" /> + <edge from-layer="4401" from-port="4" to-layer="4433" to-port="0" /> + <edge from-layer="4401" from-port="4" to-layer="4452" to-port="0" /> + <edge from-layer="4401" from-port="4" to-layer="4436" to-port="0" /> + <edge from-layer="4402" from-port="0" to-layer="4429" to-port="0" /> + <edge from-layer="4403" from-port="0" to-layer="4429" to-port="1" /> + <edge from-layer="4404" from-port="0" to-layer="4407" to-port="1" /> + <edge from-layer="4405" from-port="0" to-layer="4407" to-port="2" /> + <edge from-layer="4406" from-port="0" to-layer="4407" to-port="3" /> + <edge from-layer="4407" from-port="4" to-layer="4408" to-port="0" /> + <edge from-layer="4407" from-port="4" to-layer="4464" to-port="0" /> + <edge from-layer="4408" from-port="1" to-layer="4411" to-port="0" /> + <edge from-layer="4409" from-port="0" to-layer="4411" to-port="1" /> + <edge from-layer="4410" from-port="0" to-layer="4411" to-port="2" /> + <edge from-layer="4411" from-port="3" to-layer="4427" to-port="0" /> + <edge from-layer="4412" from-port="0" to-layer="4417" to-port="0" /> + <edge from-layer="4413" from-port="0" to-layer="4416" to-port="1" /> + <edge from-layer="4414" from-port="0" to-layer="4416" to-port="2" /> + <edge from-layer="4415" from-port="0" to-layer="4416" to-port="3" /> + <edge from-layer="4416" from-port="4" to-layer="4417" to-port="1" /> + <edge from-layer="4417" from-port="2" to-layer="4418" to-port="0" /> + <edge from-layer="4418" from-port="1" to-layer="4420" to-port="0" /> + <edge from-layer="4419" from-port="0" to-layer="4420" to-port="2" /> + <edge from-layer="4420" from-port="3" to-layer="4421" to-port="0" /> + <edge from-layer="4420" from-port="3" to-layer="4492" to-port="0" /> + <edge from-layer="4421" from-port="1" to-layer="4424" to-port="0" /> + <edge from-layer="4422" from-port="0" to-layer="4424" to-port="1" /> + <edge from-layer="4423" from-port="0" to-layer="4424" to-port="2" /> + <edge from-layer="4424" from-port="3" to-layer="4516" to-port="0" /> + <edge from-layer="4424" from-port="3" to-layer="4426" to-port="0" /> + <edge from-layer="4425" from-port="0" to-layer="4426" to-port="1" /> + <edge from-layer="4426" from-port="2" to-layer="4427" to-port="1" /> + <edge from-layer="4427" from-port="2" to-layer="4457" to-port="2" /> + <edge from-layer="4427" from-port="2" to-layer="4429" to-port="2" /> + <edge from-layer="4428" from-port="0" to-layer="4429" to-port="3" /> + <edge from-layer="4429" from-port="4" to-layer="4431" to-port="0" /> + <edge from-layer="4430" from-port="0" to-layer="4431" to-port="2" /> + <edge from-layer="4431" from-port="3" to-layer="4432" to-port="0" /> + <edge from-layer="4432" from-port="2" to-layer="4469" to-port="1" /> + <edge from-layer="4432" from-port="2" to-layer="4433" to-port="1" /> + <edge from-layer="4433" from-port="2" to-layer="4462" to-port="0" /> + <edge from-layer="4434" from-port="0" to-layer="4444" to-port="0" /> + <edge from-layer="4435" from-port="0" to-layer="4444" to-port="1" /> + <edge from-layer="4436" from-port="1" to-layer="4438" to-port="0" /> + <edge from-layer="4437" from-port="0" to-layer="4438" to-port="2" /> + <edge from-layer="4438" from-port="3" to-layer="4439" to-port="0" /> + <edge from-layer="4439" from-port="2" to-layer="4440" to-port="0" /> + <edge from-layer="4440" from-port="1" to-layer="4442" to-port="0" /> + <edge from-layer="4441" from-port="0" to-layer="4442" to-port="1" /> + <edge from-layer="4442" from-port="2" to-layer="4444" to-port="2" /> + <edge from-layer="4443" from-port="0" to-layer="4444" to-port="3" /> + <edge from-layer="4444" from-port="4" to-layer="4452" to-port="2" /> + <edge from-layer="4444" from-port="4" to-layer="4447" to-port="1" /> + <edge from-layer="4445" from-port="0" to-layer="4447" to-port="2" /> + <edge from-layer="4446" from-port="0" to-layer="4447" to-port="3" /> + <edge from-layer="4447" from-port="4" to-layer="4449" to-port="0" /> + <edge from-layer="4448" from-port="0" to-layer="4449" to-port="1" /> + <edge from-layer="4449" from-port="2" to-layer="4453" to-port="0" /> + <edge from-layer="4450" from-port="0" to-layer="4452" to-port="1" /> + <edge from-layer="4451" from-port="0" to-layer="4452" to-port="3" /> + <edge from-layer="4452" from-port="4" to-layer="4453" to-port="1" /> + <edge from-layer="4453" from-port="2" to-layer="4461" to-port="0" /> + <edge from-layer="4454" from-port="0" to-layer="4457" to-port="0" /> + <edge from-layer="4455" from-port="0" to-layer="4457" to-port="1" /> + <edge from-layer="4456" from-port="0" to-layer="4457" to-port="3" /> + <edge from-layer="4457" from-port="4" to-layer="4459" to-port="0" /> + <edge from-layer="4458" from-port="0" to-layer="4459" to-port="2" /> + <edge from-layer="4459" from-port="3" to-layer="4460" to-port="0" /> + <edge from-layer="4460" from-port="2" to-layer="4461" to-port="1" /> + <edge from-layer="4460" from-port="2" to-layer="4490" to-port="1" /> + <edge from-layer="4461" from-port="2" to-layer="4462" to-port="1" /> + <edge from-layer="4462" from-port="2" to-layer="4517" to-port="0" /> + <edge from-layer="4462" from-port="2" to-layer="4553" to-port="0" /> + <edge from-layer="4463" from-port="0" to-layer="4464" to-port="1" /> + <edge from-layer="4464" from-port="2" to-layer="4468" to-port="0" /> + <edge from-layer="4465" from-port="0" to-layer="4468" to-port="1" /> + <edge from-layer="4466" from-port="0" to-layer="4468" to-port="2" /> + <edge from-layer="4467" from-port="0" to-layer="4468" to-port="3" /> + <edge from-layer="4468" from-port="4" to-layer="4483" to-port="0" /> + <edge from-layer="4468" from-port="4" to-layer="4488" to-port="0" /> + <edge from-layer="4468" from-port="4" to-layer="4472" to-port="0" /> + <edge from-layer="4468" from-port="4" to-layer="4469" to-port="0" /> + <edge from-layer="4469" from-port="2" to-layer="4491" to-port="0" /> + <edge from-layer="4470" from-port="0" to-layer="4480" to-port="0" /> + <edge from-layer="4471" from-port="0" to-layer="4480" to-port="1" /> + <edge from-layer="4472" from-port="1" to-layer="4474" to-port="0" /> + <edge from-layer="4473" from-port="0" to-layer="4474" to-port="2" /> + <edge from-layer="4474" from-port="3" to-layer="4475" to-port="0" /> + <edge from-layer="4475" from-port="2" to-layer="4476" to-port="0" /> + <edge from-layer="4476" from-port="1" to-layer="4478" to-port="0" /> + <edge from-layer="4477" from-port="0" to-layer="4478" to-port="1" /> + <edge from-layer="4478" from-port="2" to-layer="4480" to-port="2" /> + <edge from-layer="4479" from-port="0" to-layer="4480" to-port="3" /> + <edge from-layer="4480" from-port="4" to-layer="4488" to-port="2" /> + <edge from-layer="4480" from-port="4" to-layer="4483" to-port="1" /> + <edge from-layer="4481" from-port="0" to-layer="4483" to-port="2" /> + <edge from-layer="4482" from-port="0" to-layer="4483" to-port="3" /> + <edge from-layer="4483" from-port="4" to-layer="4485" to-port="0" /> + <edge from-layer="4484" from-port="0" to-layer="4485" to-port="1" /> + <edge from-layer="4485" from-port="2" to-layer="4489" to-port="0" /> + <edge from-layer="4486" from-port="0" to-layer="4488" to-port="1" /> + <edge from-layer="4487" from-port="0" to-layer="4488" to-port="3" /> + <edge from-layer="4488" from-port="4" to-layer="4489" to-port="1" /> + <edge from-layer="4489" from-port="2" to-layer="4490" to-port="0" /> + <edge from-layer="4490" from-port="2" to-layer="4491" to-port="1" /> + <edge from-layer="4491" from-port="2" to-layer="4492" to-port="1" /> + <edge from-layer="4491" from-port="2" to-layer="4512" to-port="0" /> + <edge from-layer="4492" from-port="2" to-layer="7218" to-port="0" /> + <edge from-layer="4492" from-port="2" to-layer="4553" to-port="1" /> + <edge from-layer="4493" from-port="0" to-layer="4498" to-port="0" /> + <edge from-layer="4494" from-port="0" to-layer="4497" to-port="1" /> + <edge from-layer="4495" from-port="0" to-layer="4497" to-port="2" /> + <edge from-layer="4496" from-port="0" to-layer="4497" to-port="3" /> + <edge from-layer="4497" from-port="4" to-layer="4498" to-port="1" /> + <edge from-layer="4498" from-port="2" to-layer="4499" to-port="0" /> + <edge from-layer="4499" from-port="1" to-layer="4501" to-port="0" /> + <edge from-layer="4500" from-port="0" to-layer="4501" to-port="2" /> + <edge from-layer="4501" from-port="3" to-layer="4508" to-port="0" /> + <edge from-layer="4502" from-port="0" to-layer="4505" to-port="1" /> + <edge from-layer="4503" from-port="0" to-layer="4505" to-port="2" /> + <edge from-layer="4504" from-port="0" to-layer="4505" to-port="3" /> + <edge from-layer="4505" from-port="4" to-layer="4507" to-port="0" /> + <edge from-layer="4506" from-port="0" to-layer="4507" to-port="1" /> + <edge from-layer="4507" from-port="2" to-layer="4508" to-port="1" /> + <edge from-layer="4508" from-port="2" to-layer="4553" to-port="2" /> + <edge from-layer="4508" from-port="2" to-layer="7217" to-port="0" /> + <edge from-layer="4509" from-port="0" to-layer="4531" to-port="0" /> + <edge from-layer="4510" from-port="0" to-layer="4525" to-port="0" /> + <edge from-layer="4511" from-port="0" to-layer="4525" to-port="1" /> + <edge from-layer="4511" from-port="0" to-layer="4529" to-port="1" /> + <edge from-layer="4512" from-port="1" to-layer="4515" to-port="0" /> + <edge from-layer="4513" from-port="0" to-layer="4515" to-port="1" /> + <edge from-layer="4514" from-port="0" to-layer="4515" to-port="2" /> + <edge from-layer="4515" from-port="3" to-layer="4516" to-port="1" /> + <edge from-layer="4516" from-port="2" to-layer="4521" to-port="0" /> + <edge from-layer="4516" from-port="2" to-layer="4528" to-port="0" /> + <edge from-layer="4517" from-port="1" to-layer="4546" to-port="0" /> + <edge from-layer="4517" from-port="1" to-layer="4520" to-port="0" /> + <edge from-layer="4518" from-port="0" to-layer="4520" to-port="1" /> + <edge from-layer="4519" from-port="0" to-layer="4520" to-port="2" /> + <edge from-layer="4520" from-port="3" to-layer="4521" to-port="1" /> + <edge from-layer="4521" from-port="2" to-layer="4523" to-port="0" /> + <edge from-layer="4522" from-port="0" to-layer="4523" to-port="1" /> + <edge from-layer="4523" from-port="2" to-layer="4525" to-port="2" /> + <edge from-layer="4524" from-port="0" to-layer="4529" to-port="3" /> + <edge from-layer="4524" from-port="0" to-layer="4525" to-port="3" /> + <edge from-layer="4525" from-port="4" to-layer="4531" to-port="1" /> + <edge from-layer="4526" from-port="0" to-layer="4529" to-port="0" /> + <edge from-layer="4527" from-port="0" to-layer="4528" to-port="1" /> + <edge from-layer="4528" from-port="2" to-layer="4529" to-port="2" /> + <edge from-layer="4528" from-port="2" to-layer="4536" to-port="2" /> + <edge from-layer="4529" from-port="4" to-layer="4531" to-port="2" /> + <edge from-layer="4530" from-port="0" to-layer="4531" to-port="3" /> + <edge from-layer="4531" from-port="4" to-layer="4538" to-port="0" /> + <edge from-layer="4532" from-port="0" to-layer="4538" to-port="1" /> + <edge from-layer="4533" from-port="0" to-layer="4536" to-port="0" /> + <edge from-layer="4534" from-port="0" to-layer="4536" to-port="1" /> + <edge from-layer="4535" from-port="0" to-layer="4536" to-port="3" /> + <edge from-layer="4536" from-port="4" to-layer="4538" to-port="2" /> + <edge from-layer="4537" from-port="0" to-layer="4538" to-port="3" /> + <edge from-layer="4538" from-port="4" to-layer="4541" to-port="0" /> + <edge from-layer="4539" from-port="0" to-layer="4541" to-port="1" /> + <edge from-layer="4540" from-port="0" to-layer="4541" to-port="2" /> + <edge from-layer="4541" from-port="3" to-layer="4542" to-port="0" /> + <edge from-layer="4542" from-port="2" to-layer="4552" to-port="0" /> + <edge from-layer="4542" from-port="2" to-layer="4543" to-port="0" /> + <edge from-layer="4543" from-port="1" to-layer="4551" to-port="0" /> + <edge from-layer="4544" from-port="0" to-layer="4546" to-port="1" /> + <edge from-layer="4545" from-port="0" to-layer="4546" to-port="2" /> + <edge from-layer="4546" from-port="3" to-layer="4550" to-port="0" /> + <edge from-layer="4547" from-port="0" to-layer="4550" to-port="1" /> + <edge from-layer="4548" from-port="0" to-layer="4550" to-port="2" /> + <edge from-layer="4549" from-port="0" to-layer="4550" to-port="3" /> + <edge from-layer="4550" from-port="4" to-layer="4551" to-port="1" /> + <edge from-layer="4551" from-port="2" to-layer="4552" to-port="1" /> + <edge from-layer="4552" from-port="2" to-layer="4553" to-port="3" /> + <edge from-layer="4553" from-port="4" to-layer="4555" to-port="0" /> + <edge from-layer="4554" from-port="0" to-layer="4555" to-port="1" /> + <edge from-layer="4555" from-port="2" to-layer="4557" to-port="0" /> + <edge from-layer="4556" from-port="0" to-layer="4557" to-port="1" /> + <edge from-layer="4557" from-port="2" to-layer="4566" to-port="0" /> + <edge from-layer="4558" from-port="0" to-layer="4559" to-port="0" /> + <edge from-layer="4559" from-port="1" to-layer="4562" to-port="0" /> + <edge from-layer="4560" from-port="0" to-layer="4561" to-port="0" /> + <edge from-layer="4561" from-port="1" to-layer="4562" to-port="1" /> + <edge from-layer="4562" from-port="2" to-layer="4564" to-port="0" /> + <edge from-layer="4563" from-port="0" to-layer="4564" to-port="1" /> + <edge from-layer="4564" from-port="2" to-layer="4565" to-port="0" /> + <edge from-layer="4565" from-port="1" to-layer="4566" to-port="1" /> + <edge from-layer="4566" from-port="2" to-layer="4568" to-port="0" /> + <edge from-layer="4567" from-port="0" to-layer="4568" to-port="1" /> + <edge from-layer="4568" from-port="2" to-layer="4569" to-port="0" /> + <edge from-layer="4569" from-port="2" to-layer="4571" to-port="0" /> + <edge from-layer="4569" from-port="2" to-layer="4599" to-port="1" /> + <edge from-layer="4570" from-port="0" to-layer="4571" to-port="1" /> + <edge from-layer="4571" from-port="2" to-layer="4573" to-port="0" /> + <edge from-layer="4572" from-port="0" to-layer="4573" to-port="1" /> + <edge from-layer="4573" from-port="2" to-layer="4575" to-port="0" /> + <edge from-layer="4574" from-port="0" to-layer="4575" to-port="1" /> + <edge from-layer="4575" from-port="2" to-layer="4584" to-port="0" /> + <edge from-layer="4576" from-port="0" to-layer="4577" to-port="0" /> + <edge from-layer="4577" from-port="1" to-layer="4580" to-port="0" /> + <edge from-layer="4578" from-port="0" to-layer="4579" to-port="0" /> + <edge from-layer="4579" from-port="1" to-layer="4580" to-port="1" /> + <edge from-layer="4580" from-port="2" to-layer="4582" to-port="0" /> + <edge from-layer="4581" from-port="0" to-layer="4582" to-port="1" /> + <edge from-layer="4582" from-port="2" to-layer="4583" to-port="0" /> + <edge from-layer="4583" from-port="1" to-layer="4584" to-port="1" /> + <edge from-layer="4584" from-port="2" to-layer="4586" to-port="0" /> + <edge from-layer="4585" from-port="0" to-layer="4586" to-port="1" /> + <edge from-layer="4586" from-port="2" to-layer="4587" to-port="0" /> + <edge from-layer="4587" from-port="1" to-layer="4596" to-port="0" /> + <edge from-layer="4588" from-port="0" to-layer="4589" to-port="0" /> + <edge from-layer="4589" from-port="1" to-layer="4592" to-port="0" /> + <edge from-layer="4590" from-port="0" to-layer="4591" to-port="0" /> + <edge from-layer="4591" from-port="1" to-layer="4592" to-port="1" /> + <edge from-layer="4592" from-port="2" to-layer="4594" to-port="0" /> + <edge from-layer="4593" from-port="0" to-layer="4594" to-port="1" /> + <edge from-layer="4594" from-port="2" to-layer="4595" to-port="0" /> + <edge from-layer="4595" from-port="1" to-layer="4596" to-port="1" /> + <edge from-layer="4596" from-port="2" to-layer="4598" to-port="0" /> + <edge from-layer="4597" from-port="0" to-layer="4598" to-port="1" /> + <edge from-layer="4598" from-port="2" to-layer="4599" to-port="0" /> + <edge from-layer="4599" from-port="2" to-layer="4796" to-port="1" /> + <edge from-layer="4599" from-port="2" to-layer="4601" to-port="0" /> + <edge from-layer="4600" from-port="0" to-layer="4601" to-port="1" /> + <edge from-layer="4601" from-port="2" to-layer="4603" to-port="0" /> + <edge from-layer="4602" from-port="0" to-layer="4603" to-port="1" /> + <edge from-layer="4603" from-port="2" to-layer="4605" to-port="0" /> + <edge from-layer="4604" from-port="0" to-layer="4605" to-port="1" /> + <edge from-layer="4605" from-port="2" to-layer="4614" to-port="0" /> + <edge from-layer="4606" from-port="0" to-layer="4607" to-port="0" /> + <edge from-layer="4607" from-port="1" to-layer="4610" to-port="0" /> + <edge from-layer="4608" from-port="0" to-layer="4609" to-port="0" /> + <edge from-layer="4609" from-port="1" to-layer="4610" to-port="1" /> + <edge from-layer="4610" from-port="2" to-layer="4612" to-port="0" /> + <edge from-layer="4611" from-port="0" to-layer="4612" to-port="1" /> + <edge from-layer="4612" from-port="2" to-layer="4613" to-port="0" /> + <edge from-layer="4613" from-port="1" to-layer="4614" to-port="1" /> + <edge from-layer="4614" from-port="2" to-layer="4616" to-port="0" /> + <edge from-layer="4615" from-port="0" to-layer="4616" to-port="1" /> + <edge from-layer="4616" from-port="2" to-layer="4618" to-port="0" /> + <edge from-layer="4617" from-port="0" to-layer="4618" to-port="1" /> + <edge from-layer="4618" from-port="2" to-layer="4634" to-port="0" /> + <edge from-layer="4618" from-port="2" to-layer="4732" to-port="0" /> + <edge from-layer="4618" from-port="2" to-layer="4622" to-port="0" /> + <edge from-layer="4619" from-port="0" to-layer="4622" to-port="1" /> + <edge from-layer="4620" from-port="0" to-layer="4622" to-port="2" /> + <edge from-layer="4621" from-port="0" to-layer="4622" to-port="3" /> + <edge from-layer="4622" from-port="4" to-layer="4624" to-port="0" /> + <edge from-layer="4623" from-port="0" to-layer="4624" to-port="1" /> + <edge from-layer="4624" from-port="2" to-layer="4628" to-port="0" /> + <edge from-layer="4625" from-port="0" to-layer="4628" to-port="1" /> + <edge from-layer="4626" from-port="0" to-layer="4628" to-port="2" /> + <edge from-layer="4627" from-port="0" to-layer="4628" to-port="3" /> + <edge from-layer="4628" from-port="4" to-layer="4663" to-port="0" /> + <edge from-layer="4628" from-port="4" to-layer="4679" to-port="0" /> + <edge from-layer="4628" from-port="4" to-layer="4660" to-port="0" /> + <edge from-layer="4628" from-port="4" to-layer="4674" to-port="0" /> + <edge from-layer="4629" from-port="0" to-layer="4656" to-port="0" /> + <edge from-layer="4630" from-port="0" to-layer="4656" to-port="1" /> + <edge from-layer="4631" from-port="0" to-layer="4634" to-port="1" /> + <edge from-layer="4632" from-port="0" to-layer="4634" to-port="2" /> + <edge from-layer="4633" from-port="0" to-layer="4634" to-port="3" /> + <edge from-layer="4634" from-port="4" to-layer="4691" to-port="0" /> + <edge from-layer="4634" from-port="4" to-layer="4635" to-port="0" /> + <edge from-layer="4635" from-port="1" to-layer="4638" to-port="0" /> + <edge from-layer="4636" from-port="0" to-layer="4638" to-port="1" /> + <edge from-layer="4637" from-port="0" to-layer="4638" to-port="2" /> + <edge from-layer="4638" from-port="3" to-layer="4654" to-port="0" /> + <edge from-layer="4639" from-port="0" to-layer="4644" to-port="0" /> + <edge from-layer="4640" from-port="0" to-layer="4643" to-port="1" /> + <edge from-layer="4641" from-port="0" to-layer="4643" to-port="2" /> + <edge from-layer="4642" from-port="0" to-layer="4643" to-port="3" /> + <edge from-layer="4643" from-port="4" to-layer="4644" to-port="1" /> + <edge from-layer="4644" from-port="2" to-layer="4645" to-port="0" /> + <edge from-layer="4645" from-port="1" to-layer="4647" to-port="0" /> + <edge from-layer="4646" from-port="0" to-layer="4647" to-port="2" /> + <edge from-layer="4647" from-port="3" to-layer="4648" to-port="0" /> + <edge from-layer="4647" from-port="3" to-layer="4719" to-port="0" /> + <edge from-layer="4648" from-port="1" to-layer="4651" to-port="0" /> + <edge from-layer="4649" from-port="0" to-layer="4651" to-port="1" /> + <edge from-layer="4650" from-port="0" to-layer="4651" to-port="2" /> + <edge from-layer="4651" from-port="3" to-layer="4653" to-port="0" /> + <edge from-layer="4651" from-port="3" to-layer="4743" to-port="0" /> + <edge from-layer="4652" from-port="0" to-layer="4653" to-port="1" /> + <edge from-layer="4653" from-port="2" to-layer="4654" to-port="1" /> + <edge from-layer="4654" from-port="2" to-layer="4656" to-port="2" /> + <edge from-layer="4654" from-port="2" to-layer="4684" to-port="2" /> + <edge from-layer="4655" from-port="0" to-layer="4656" to-port="3" /> + <edge from-layer="4656" from-port="4" to-layer="4658" to-port="0" /> + <edge from-layer="4657" from-port="0" to-layer="4658" to-port="2" /> + <edge from-layer="4658" from-port="3" to-layer="4659" to-port="0" /> + <edge from-layer="4659" from-port="2" to-layer="4660" to-port="1" /> + <edge from-layer="4659" from-port="2" to-layer="4696" to-port="1" /> + <edge from-layer="4660" from-port="2" to-layer="4689" to-port="0" /> + <edge from-layer="4661" from-port="0" to-layer="4671" to-port="0" /> + <edge from-layer="4662" from-port="0" to-layer="4671" to-port="1" /> + <edge from-layer="4663" from-port="1" to-layer="4665" to-port="0" /> + <edge from-layer="4664" from-port="0" to-layer="4665" to-port="2" /> + <edge from-layer="4665" from-port="3" to-layer="4666" to-port="0" /> + <edge from-layer="4666" from-port="2" to-layer="4667" to-port="0" /> + <edge from-layer="4667" from-port="1" to-layer="4669" to-port="0" /> + <edge from-layer="4668" from-port="0" to-layer="4669" to-port="1" /> + <edge from-layer="4669" from-port="2" to-layer="4671" to-port="2" /> + <edge from-layer="4670" from-port="0" to-layer="4671" to-port="3" /> + <edge from-layer="4671" from-port="4" to-layer="4674" to-port="1" /> + <edge from-layer="4671" from-port="4" to-layer="4679" to-port="2" /> + <edge from-layer="4672" from-port="0" to-layer="4674" to-port="2" /> + <edge from-layer="4673" from-port="0" to-layer="4674" to-port="3" /> + <edge from-layer="4674" from-port="4" to-layer="4676" to-port="0" /> + <edge from-layer="4675" from-port="0" to-layer="4676" to-port="1" /> + <edge from-layer="4676" from-port="2" to-layer="4680" to-port="0" /> + <edge from-layer="4677" from-port="0" to-layer="4679" to-port="1" /> + <edge from-layer="4678" from-port="0" to-layer="4679" to-port="3" /> + <edge from-layer="4679" from-port="4" to-layer="4680" to-port="1" /> + <edge from-layer="4680" from-port="2" to-layer="4688" to-port="0" /> + <edge from-layer="4681" from-port="0" to-layer="4684" to-port="0" /> + <edge from-layer="4682" from-port="0" to-layer="4684" to-port="1" /> + <edge from-layer="4683" from-port="0" to-layer="4684" to-port="3" /> + <edge from-layer="4684" from-port="4" to-layer="4686" to-port="0" /> + <edge from-layer="4685" from-port="0" to-layer="4686" to-port="2" /> + <edge from-layer="4686" from-port="3" to-layer="4687" to-port="0" /> + <edge from-layer="4687" from-port="2" to-layer="4717" to-port="1" /> + <edge from-layer="4687" from-port="2" to-layer="4688" to-port="1" /> + <edge from-layer="4688" from-port="2" to-layer="4689" to-port="1" /> + <edge from-layer="4689" from-port="2" to-layer="4744" to-port="0" /> + <edge from-layer="4689" from-port="2" to-layer="4780" to-port="0" /> + <edge from-layer="4690" from-port="0" to-layer="4691" to-port="1" /> + <edge from-layer="4691" from-port="2" to-layer="4695" to-port="0" /> + <edge from-layer="4692" from-port="0" to-layer="4695" to-port="1" /> + <edge from-layer="4693" from-port="0" to-layer="4695" to-port="2" /> + <edge from-layer="4694" from-port="0" to-layer="4695" to-port="3" /> + <edge from-layer="4695" from-port="4" to-layer="4710" to-port="0" /> + <edge from-layer="4695" from-port="4" to-layer="4715" to-port="0" /> + <edge from-layer="4695" from-port="4" to-layer="4699" to-port="0" /> + <edge from-layer="4695" from-port="4" to-layer="4696" to-port="0" /> + <edge from-layer="4696" from-port="2" to-layer="4718" to-port="0" /> + <edge from-layer="4697" from-port="0" to-layer="4707" to-port="0" /> + <edge from-layer="4698" from-port="0" to-layer="4707" to-port="1" /> + <edge from-layer="4699" from-port="1" to-layer="4701" to-port="0" /> + <edge from-layer="4700" from-port="0" to-layer="4701" to-port="2" /> + <edge from-layer="4701" from-port="3" to-layer="4702" to-port="0" /> + <edge from-layer="4702" from-port="2" to-layer="4703" to-port="0" /> + <edge from-layer="4703" from-port="1" to-layer="4705" to-port="0" /> + <edge from-layer="4704" from-port="0" to-layer="4705" to-port="1" /> + <edge from-layer="4705" from-port="2" to-layer="4707" to-port="2" /> + <edge from-layer="4706" from-port="0" to-layer="4707" to-port="3" /> + <edge from-layer="4707" from-port="4" to-layer="4710" to-port="1" /> + <edge from-layer="4707" from-port="4" to-layer="4715" to-port="2" /> + <edge from-layer="4708" from-port="0" to-layer="4710" to-port="2" /> + <edge from-layer="4709" from-port="0" to-layer="4710" to-port="3" /> + <edge from-layer="4710" from-port="4" to-layer="4712" to-port="0" /> + <edge from-layer="4711" from-port="0" to-layer="4712" to-port="1" /> + <edge from-layer="4712" from-port="2" to-layer="4716" to-port="0" /> + <edge from-layer="4713" from-port="0" to-layer="4715" to-port="1" /> + <edge from-layer="4714" from-port="0" to-layer="4715" to-port="3" /> + <edge from-layer="4715" from-port="4" to-layer="4716" to-port="1" /> + <edge from-layer="4716" from-port="2" to-layer="4717" to-port="0" /> + <edge from-layer="4717" from-port="2" to-layer="4718" to-port="1" /> + <edge from-layer="4718" from-port="2" to-layer="4739" to-port="0" /> + <edge from-layer="4718" from-port="2" to-layer="4719" to-port="1" /> + <edge from-layer="4719" from-port="2" to-layer="7214" to-port="0" /> + <edge from-layer="4719" from-port="2" to-layer="4780" to-port="1" /> + <edge from-layer="4720" from-port="0" to-layer="4725" to-port="0" /> + <edge from-layer="4721" from-port="0" to-layer="4724" to-port="1" /> + <edge from-layer="4722" from-port="0" to-layer="4724" to-port="2" /> + <edge from-layer="4723" from-port="0" to-layer="4724" to-port="3" /> + <edge from-layer="4724" from-port="4" to-layer="4725" to-port="1" /> + <edge from-layer="4725" from-port="2" to-layer="4726" to-port="0" /> + <edge from-layer="4726" from-port="1" to-layer="4728" to-port="0" /> + <edge from-layer="4727" from-port="0" to-layer="4728" to-port="2" /> + <edge from-layer="4728" from-port="3" to-layer="4735" to-port="0" /> + <edge from-layer="4729" from-port="0" to-layer="4732" to-port="1" /> + <edge from-layer="4730" from-port="0" to-layer="4732" to-port="2" /> + <edge from-layer="4731" from-port="0" to-layer="4732" to-port="3" /> + <edge from-layer="4732" from-port="4" to-layer="4734" to-port="0" /> + <edge from-layer="4733" from-port="0" to-layer="4734" to-port="1" /> + <edge from-layer="4734" from-port="2" to-layer="4735" to-port="1" /> + <edge from-layer="4735" from-port="2" to-layer="4780" to-port="2" /> + <edge from-layer="4735" from-port="2" to-layer="7213" to-port="0" /> + <edge from-layer="4736" from-port="0" to-layer="4758" to-port="0" /> + <edge from-layer="4737" from-port="0" to-layer="4752" to-port="0" /> + <edge from-layer="4738" from-port="0" to-layer="4752" to-port="1" /> + <edge from-layer="4738" from-port="0" to-layer="4756" to-port="1" /> + <edge from-layer="4739" from-port="1" to-layer="4742" to-port="0" /> + <edge from-layer="4740" from-port="0" to-layer="4742" to-port="1" /> + <edge from-layer="4741" from-port="0" to-layer="4742" to-port="2" /> + <edge from-layer="4742" from-port="3" to-layer="4743" to-port="1" /> + <edge from-layer="4743" from-port="2" to-layer="4748" to-port="0" /> + <edge from-layer="4743" from-port="2" to-layer="4755" to-port="0" /> + <edge from-layer="4744" from-port="1" to-layer="4773" to-port="0" /> + <edge from-layer="4744" from-port="1" to-layer="4747" to-port="0" /> + <edge from-layer="4745" from-port="0" to-layer="4747" to-port="1" /> + <edge from-layer="4746" from-port="0" to-layer="4747" to-port="2" /> + <edge from-layer="4747" from-port="3" to-layer="4748" to-port="1" /> + <edge from-layer="4748" from-port="2" to-layer="4750" to-port="0" /> + <edge from-layer="4749" from-port="0" to-layer="4750" to-port="1" /> + <edge from-layer="4750" from-port="2" to-layer="4752" to-port="2" /> + <edge from-layer="4751" from-port="0" to-layer="4756" to-port="3" /> + <edge from-layer="4751" from-port="0" to-layer="4752" to-port="3" /> + <edge from-layer="4752" from-port="4" to-layer="4758" to-port="1" /> + <edge from-layer="4753" from-port="0" to-layer="4756" to-port="0" /> + <edge from-layer="4754" from-port="0" to-layer="4755" to-port="1" /> + <edge from-layer="4755" from-port="2" to-layer="4756" to-port="2" /> + <edge from-layer="4755" from-port="2" to-layer="4763" to-port="2" /> + <edge from-layer="4756" from-port="4" to-layer="4758" to-port="2" /> + <edge from-layer="4757" from-port="0" to-layer="4758" to-port="3" /> + <edge from-layer="4758" from-port="4" to-layer="4765" to-port="0" /> + <edge from-layer="4759" from-port="0" to-layer="4765" to-port="1" /> + <edge from-layer="4760" from-port="0" to-layer="4763" to-port="0" /> + <edge from-layer="4761" from-port="0" to-layer="4763" to-port="1" /> + <edge from-layer="4762" from-port="0" to-layer="4763" to-port="3" /> + <edge from-layer="4763" from-port="4" to-layer="4765" to-port="2" /> + <edge from-layer="4764" from-port="0" to-layer="4765" to-port="3" /> + <edge from-layer="4765" from-port="4" to-layer="4768" to-port="0" /> + <edge from-layer="4766" from-port="0" to-layer="4768" to-port="1" /> + <edge from-layer="4767" from-port="0" to-layer="4768" to-port="2" /> + <edge from-layer="4768" from-port="3" to-layer="4769" to-port="0" /> + <edge from-layer="4769" from-port="2" to-layer="4779" to-port="0" /> + <edge from-layer="4769" from-port="2" to-layer="4770" to-port="0" /> + <edge from-layer="4770" from-port="1" to-layer="4778" to-port="0" /> + <edge from-layer="4771" from-port="0" to-layer="4773" to-port="1" /> + <edge from-layer="4772" from-port="0" to-layer="4773" to-port="2" /> + <edge from-layer="4773" from-port="3" to-layer="4777" to-port="0" /> + <edge from-layer="4774" from-port="0" to-layer="4777" to-port="1" /> + <edge from-layer="4775" from-port="0" to-layer="4777" to-port="2" /> + <edge from-layer="4776" from-port="0" to-layer="4777" to-port="3" /> + <edge from-layer="4777" from-port="4" to-layer="4778" to-port="1" /> + <edge from-layer="4778" from-port="2" to-layer="4779" to-port="1" /> + <edge from-layer="4779" from-port="2" to-layer="4780" to-port="3" /> + <edge from-layer="4780" from-port="4" to-layer="4782" to-port="0" /> + <edge from-layer="4781" from-port="0" to-layer="4782" to-port="1" /> + <edge from-layer="4782" from-port="2" to-layer="4784" to-port="0" /> + <edge from-layer="4783" from-port="0" to-layer="4784" to-port="1" /> + <edge from-layer="4784" from-port="2" to-layer="4793" to-port="0" /> + <edge from-layer="4785" from-port="0" to-layer="4786" to-port="0" /> + <edge from-layer="4786" from-port="1" to-layer="4789" to-port="0" /> + <edge from-layer="4787" from-port="0" to-layer="4788" to-port="0" /> + <edge from-layer="4788" from-port="1" to-layer="4789" to-port="1" /> + <edge from-layer="4789" from-port="2" to-layer="4791" to-port="0" /> + <edge from-layer="4790" from-port="0" to-layer="4791" to-port="1" /> + <edge from-layer="4791" from-port="2" to-layer="4792" to-port="0" /> + <edge from-layer="4792" from-port="1" to-layer="4793" to-port="1" /> + <edge from-layer="4793" from-port="2" to-layer="4795" to-port="0" /> + <edge from-layer="4794" from-port="0" to-layer="4795" to-port="1" /> + <edge from-layer="4795" from-port="2" to-layer="4796" to-port="0" /> + <edge from-layer="4796" from-port="2" to-layer="4826" to-port="1" /> + <edge from-layer="4796" from-port="2" to-layer="4798" to-port="0" /> + <edge from-layer="4797" from-port="0" to-layer="4798" to-port="1" /> + <edge from-layer="4798" from-port="2" to-layer="4800" to-port="0" /> + <edge from-layer="4799" from-port="0" to-layer="4800" to-port="1" /> + <edge from-layer="4800" from-port="2" to-layer="4802" to-port="0" /> + <edge from-layer="4801" from-port="0" to-layer="4802" to-port="1" /> + <edge from-layer="4802" from-port="2" to-layer="4811" to-port="0" /> + <edge from-layer="4803" from-port="0" to-layer="4804" to-port="0" /> + <edge from-layer="4804" from-port="1" to-layer="4807" to-port="0" /> + <edge from-layer="4805" from-port="0" to-layer="4806" to-port="0" /> + <edge from-layer="4806" from-port="1" to-layer="4807" to-port="1" /> + <edge from-layer="4807" from-port="2" to-layer="4809" to-port="0" /> + <edge from-layer="4808" from-port="0" to-layer="4809" to-port="1" /> + <edge from-layer="4809" from-port="2" to-layer="4810" to-port="0" /> + <edge from-layer="4810" from-port="1" to-layer="4811" to-port="1" /> + <edge from-layer="4811" from-port="2" to-layer="4813" to-port="0" /> + <edge from-layer="4812" from-port="0" to-layer="4813" to-port="1" /> + <edge from-layer="4813" from-port="2" to-layer="4814" to-port="0" /> + <edge from-layer="4814" from-port="1" to-layer="4823" to-port="0" /> + <edge from-layer="4815" from-port="0" to-layer="4816" to-port="0" /> + <edge from-layer="4816" from-port="1" to-layer="4819" to-port="0" /> + <edge from-layer="4817" from-port="0" to-layer="4818" to-port="0" /> + <edge from-layer="4818" from-port="1" to-layer="4819" to-port="1" /> + <edge from-layer="4819" from-port="2" to-layer="4821" to-port="0" /> + <edge from-layer="4820" from-port="0" to-layer="4821" to-port="1" /> + <edge from-layer="4821" from-port="2" to-layer="4822" to-port="0" /> + <edge from-layer="4822" from-port="1" to-layer="4823" to-port="1" /> + <edge from-layer="4823" from-port="2" to-layer="4825" to-port="0" /> + <edge from-layer="4824" from-port="0" to-layer="4825" to-port="1" /> + <edge from-layer="4825" from-port="2" to-layer="4826" to-port="0" /> + <edge from-layer="4826" from-port="2" to-layer="5023" to-port="1" /> + <edge from-layer="4826" from-port="2" to-layer="4828" to-port="0" /> + <edge from-layer="4827" from-port="0" to-layer="4828" to-port="1" /> + <edge from-layer="4828" from-port="2" to-layer="4830" to-port="0" /> + <edge from-layer="4829" from-port="0" to-layer="4830" to-port="1" /> + <edge from-layer="4830" from-port="2" to-layer="4832" to-port="0" /> + <edge from-layer="4831" from-port="0" to-layer="4832" to-port="1" /> + <edge from-layer="4832" from-port="2" to-layer="4841" to-port="0" /> + <edge from-layer="4833" from-port="0" to-layer="4834" to-port="0" /> + <edge from-layer="4834" from-port="1" to-layer="4837" to-port="0" /> + <edge from-layer="4835" from-port="0" to-layer="4836" to-port="0" /> + <edge from-layer="4836" from-port="1" to-layer="4837" to-port="1" /> + <edge from-layer="4837" from-port="2" to-layer="4839" to-port="0" /> + <edge from-layer="4838" from-port="0" to-layer="4839" to-port="1" /> + <edge from-layer="4839" from-port="2" to-layer="4840" to-port="0" /> + <edge from-layer="4840" from-port="1" to-layer="4841" to-port="1" /> + <edge from-layer="4841" from-port="2" to-layer="4843" to-port="0" /> + <edge from-layer="4842" from-port="0" to-layer="4843" to-port="1" /> + <edge from-layer="4843" from-port="2" to-layer="4845" to-port="0" /> + <edge from-layer="4844" from-port="0" to-layer="4845" to-port="1" /> + <edge from-layer="4845" from-port="2" to-layer="4959" to-port="0" /> + <edge from-layer="4845" from-port="2" to-layer="4849" to-port="0" /> + <edge from-layer="4845" from-port="2" to-layer="4861" to-port="0" /> + <edge from-layer="4846" from-port="0" to-layer="4849" to-port="1" /> + <edge from-layer="4847" from-port="0" to-layer="4849" to-port="2" /> + <edge from-layer="4848" from-port="0" to-layer="4849" to-port="3" /> + <edge from-layer="4849" from-port="4" to-layer="4851" to-port="0" /> + <edge from-layer="4850" from-port="0" to-layer="4851" to-port="1" /> + <edge from-layer="4851" from-port="2" to-layer="4855" to-port="0" /> + <edge from-layer="4852" from-port="0" to-layer="4855" to-port="1" /> + <edge from-layer="4853" from-port="0" to-layer="4855" to-port="2" /> + <edge from-layer="4854" from-port="0" to-layer="4855" to-port="3" /> + <edge from-layer="4855" from-port="4" to-layer="4887" to-port="0" /> + <edge from-layer="4855" from-port="4" to-layer="4890" to-port="0" /> + <edge from-layer="4855" from-port="4" to-layer="4901" to-port="0" /> + <edge from-layer="4855" from-port="4" to-layer="4906" to-port="0" /> + <edge from-layer="4856" from-port="0" to-layer="4883" to-port="0" /> + <edge from-layer="4857" from-port="0" to-layer="4883" to-port="1" /> + <edge from-layer="4858" from-port="0" to-layer="4861" to-port="1" /> + <edge from-layer="4859" from-port="0" to-layer="4861" to-port="2" /> + <edge from-layer="4860" from-port="0" to-layer="4861" to-port="3" /> + <edge from-layer="4861" from-port="4" to-layer="4862" to-port="0" /> + <edge from-layer="4861" from-port="4" to-layer="4918" to-port="0" /> + <edge from-layer="4862" from-port="1" to-layer="4865" to-port="0" /> + <edge from-layer="4863" from-port="0" to-layer="4865" to-port="1" /> + <edge from-layer="4864" from-port="0" to-layer="4865" to-port="2" /> + <edge from-layer="4865" from-port="3" to-layer="4881" to-port="0" /> + <edge from-layer="4866" from-port="0" to-layer="4871" to-port="0" /> + <edge from-layer="4867" from-port="0" to-layer="4870" to-port="1" /> + <edge from-layer="4868" from-port="0" to-layer="4870" to-port="2" /> + <edge from-layer="4869" from-port="0" to-layer="4870" to-port="3" /> + <edge from-layer="4870" from-port="4" to-layer="4871" to-port="1" /> + <edge from-layer="4871" from-port="2" to-layer="4872" to-port="0" /> + <edge from-layer="4872" from-port="1" to-layer="4874" to-port="0" /> + <edge from-layer="4873" from-port="0" to-layer="4874" to-port="2" /> + <edge from-layer="4874" from-port="3" to-layer="4946" to-port="0" /> + <edge from-layer="4874" from-port="3" to-layer="4875" to-port="0" /> + <edge from-layer="4875" from-port="1" to-layer="4878" to-port="0" /> + <edge from-layer="4876" from-port="0" to-layer="4878" to-port="1" /> + <edge from-layer="4877" from-port="0" to-layer="4878" to-port="2" /> + <edge from-layer="4878" from-port="3" to-layer="4880" to-port="0" /> + <edge from-layer="4878" from-port="3" to-layer="4970" to-port="0" /> + <edge from-layer="4879" from-port="0" to-layer="4880" to-port="1" /> + <edge from-layer="4880" from-port="2" to-layer="4881" to-port="1" /> + <edge from-layer="4881" from-port="2" to-layer="4883" to-port="2" /> + <edge from-layer="4881" from-port="2" to-layer="4911" to-port="2" /> + <edge from-layer="4882" from-port="0" to-layer="4883" to-port="3" /> + <edge from-layer="4883" from-port="4" to-layer="4885" to-port="0" /> + <edge from-layer="4884" from-port="0" to-layer="4885" to-port="2" /> + <edge from-layer="4885" from-port="3" to-layer="4886" to-port="0" /> + <edge from-layer="4886" from-port="2" to-layer="4887" to-port="1" /> + <edge from-layer="4886" from-port="2" to-layer="4923" to-port="1" /> + <edge from-layer="4887" from-port="2" to-layer="4916" to-port="0" /> + <edge from-layer="4888" from-port="0" to-layer="4898" to-port="0" /> + <edge from-layer="4889" from-port="0" to-layer="4898" to-port="1" /> + <edge from-layer="4890" from-port="1" to-layer="4892" to-port="0" /> + <edge from-layer="4891" from-port="0" to-layer="4892" to-port="2" /> + <edge from-layer="4892" from-port="3" to-layer="4893" to-port="0" /> + <edge from-layer="4893" from-port="2" to-layer="4894" to-port="0" /> + <edge from-layer="4894" from-port="1" to-layer="4896" to-port="0" /> + <edge from-layer="4895" from-port="0" to-layer="4896" to-port="1" /> + <edge from-layer="4896" from-port="2" to-layer="4898" to-port="2" /> + <edge from-layer="4897" from-port="0" to-layer="4898" to-port="3" /> + <edge from-layer="4898" from-port="4" to-layer="4906" to-port="2" /> + <edge from-layer="4898" from-port="4" to-layer="4901" to-port="1" /> + <edge from-layer="4899" from-port="0" to-layer="4901" to-port="2" /> + <edge from-layer="4900" from-port="0" to-layer="4901" to-port="3" /> + <edge from-layer="4901" from-port="4" to-layer="4903" to-port="0" /> + <edge from-layer="4902" from-port="0" to-layer="4903" to-port="1" /> + <edge from-layer="4903" from-port="2" to-layer="4907" to-port="0" /> + <edge from-layer="4904" from-port="0" to-layer="4906" to-port="1" /> + <edge from-layer="4905" from-port="0" to-layer="4906" to-port="3" /> + <edge from-layer="4906" from-port="4" to-layer="4907" to-port="1" /> + <edge from-layer="4907" from-port="2" to-layer="4915" to-port="0" /> + <edge from-layer="4908" from-port="0" to-layer="4911" to-port="0" /> + <edge from-layer="4909" from-port="0" to-layer="4911" to-port="1" /> + <edge from-layer="4910" from-port="0" to-layer="4911" to-port="3" /> + <edge from-layer="4911" from-port="4" to-layer="4913" to-port="0" /> + <edge from-layer="4912" from-port="0" to-layer="4913" to-port="2" /> + <edge from-layer="4913" from-port="3" to-layer="4914" to-port="0" /> + <edge from-layer="4914" from-port="2" to-layer="4944" to-port="1" /> + <edge from-layer="4914" from-port="2" to-layer="4915" to-port="1" /> + <edge from-layer="4915" from-port="2" to-layer="4916" to-port="1" /> + <edge from-layer="4916" from-port="2" to-layer="4971" to-port="0" /> + <edge from-layer="4916" from-port="2" to-layer="5007" to-port="0" /> + <edge from-layer="4917" from-port="0" to-layer="4918" to-port="1" /> + <edge from-layer="4918" from-port="2" to-layer="4922" to-port="0" /> + <edge from-layer="4919" from-port="0" to-layer="4922" to-port="1" /> + <edge from-layer="4920" from-port="0" to-layer="4922" to-port="2" /> + <edge from-layer="4921" from-port="0" to-layer="4922" to-port="3" /> + <edge from-layer="4922" from-port="4" to-layer="4926" to-port="0" /> + <edge from-layer="4922" from-port="4" to-layer="4942" to-port="0" /> + <edge from-layer="4922" from-port="4" to-layer="4923" to-port="0" /> + <edge from-layer="4922" from-port="4" to-layer="4937" to-port="0" /> + <edge from-layer="4923" from-port="2" to-layer="4945" to-port="0" /> + <edge from-layer="4924" from-port="0" to-layer="4934" to-port="0" /> + <edge from-layer="4925" from-port="0" to-layer="4934" to-port="1" /> + <edge from-layer="4926" from-port="1" to-layer="4928" to-port="0" /> + <edge from-layer="4927" from-port="0" to-layer="4928" to-port="2" /> + <edge from-layer="4928" from-port="3" to-layer="4929" to-port="0" /> + <edge from-layer="4929" from-port="2" to-layer="4930" to-port="0" /> + <edge from-layer="4930" from-port="1" to-layer="4932" to-port="0" /> + <edge from-layer="4931" from-port="0" to-layer="4932" to-port="1" /> + <edge from-layer="4932" from-port="2" to-layer="4934" to-port="2" /> + <edge from-layer="4933" from-port="0" to-layer="4934" to-port="3" /> + <edge from-layer="4934" from-port="4" to-layer="4937" to-port="1" /> + <edge from-layer="4934" from-port="4" to-layer="4942" to-port="2" /> + <edge from-layer="4935" from-port="0" to-layer="4937" to-port="2" /> + <edge from-layer="4936" from-port="0" to-layer="4937" to-port="3" /> + <edge from-layer="4937" from-port="4" to-layer="4939" to-port="0" /> + <edge from-layer="4938" from-port="0" to-layer="4939" to-port="1" /> + <edge from-layer="4939" from-port="2" to-layer="4943" to-port="0" /> + <edge from-layer="4940" from-port="0" to-layer="4942" to-port="1" /> + <edge from-layer="4941" from-port="0" to-layer="4942" to-port="3" /> + <edge from-layer="4942" from-port="4" to-layer="4943" to-port="1" /> + <edge from-layer="4943" from-port="2" to-layer="4944" to-port="0" /> + <edge from-layer="4944" from-port="2" to-layer="4945" to-port="1" /> + <edge from-layer="4945" from-port="2" to-layer="4966" to-port="0" /> + <edge from-layer="4945" from-port="2" to-layer="4946" to-port="1" /> + <edge from-layer="4946" from-port="2" to-layer="5007" to-port="1" /> + <edge from-layer="4946" from-port="2" to-layer="7212" to-port="0" /> + <edge from-layer="4947" from-port="0" to-layer="4952" to-port="0" /> + <edge from-layer="4948" from-port="0" to-layer="4951" to-port="1" /> + <edge from-layer="4949" from-port="0" to-layer="4951" to-port="2" /> + <edge from-layer="4950" from-port="0" to-layer="4951" to-port="3" /> + <edge from-layer="4951" from-port="4" to-layer="4952" to-port="1" /> + <edge from-layer="4952" from-port="2" to-layer="4953" to-port="0" /> + <edge from-layer="4953" from-port="1" to-layer="4955" to-port="0" /> + <edge from-layer="4954" from-port="0" to-layer="4955" to-port="2" /> + <edge from-layer="4955" from-port="3" to-layer="4962" to-port="0" /> + <edge from-layer="4956" from-port="0" to-layer="4959" to-port="1" /> + <edge from-layer="4957" from-port="0" to-layer="4959" to-port="2" /> + <edge from-layer="4958" from-port="0" to-layer="4959" to-port="3" /> + <edge from-layer="4959" from-port="4" to-layer="4961" to-port="0" /> + <edge from-layer="4960" from-port="0" to-layer="4961" to-port="1" /> + <edge from-layer="4961" from-port="2" to-layer="4962" to-port="1" /> + <edge from-layer="4962" from-port="2" to-layer="7211" to-port="0" /> + <edge from-layer="4962" from-port="2" to-layer="5007" to-port="2" /> + <edge from-layer="4963" from-port="0" to-layer="4985" to-port="0" /> + <edge from-layer="4964" from-port="0" to-layer="4979" to-port="0" /> + <edge from-layer="4965" from-port="0" to-layer="4979" to-port="1" /> + <edge from-layer="4965" from-port="0" to-layer="4983" to-port="1" /> + <edge from-layer="4966" from-port="1" to-layer="4969" to-port="0" /> + <edge from-layer="4967" from-port="0" to-layer="4969" to-port="1" /> + <edge from-layer="4968" from-port="0" to-layer="4969" to-port="2" /> + <edge from-layer="4969" from-port="3" to-layer="4970" to-port="1" /> + <edge from-layer="4970" from-port="2" to-layer="4982" to-port="0" /> + <edge from-layer="4970" from-port="2" to-layer="4975" to-port="0" /> + <edge from-layer="4971" from-port="1" to-layer="4974" to-port="0" /> + <edge from-layer="4971" from-port="1" to-layer="5000" to-port="0" /> + <edge from-layer="4972" from-port="0" to-layer="4974" to-port="1" /> + <edge from-layer="4973" from-port="0" to-layer="4974" to-port="2" /> + <edge from-layer="4974" from-port="3" to-layer="4975" to-port="1" /> + <edge from-layer="4975" from-port="2" to-layer="4977" to-port="0" /> + <edge from-layer="4976" from-port="0" to-layer="4977" to-port="1" /> + <edge from-layer="4977" from-port="2" to-layer="4979" to-port="2" /> + <edge from-layer="4978" from-port="0" to-layer="4983" to-port="3" /> + <edge from-layer="4978" from-port="0" to-layer="4979" to-port="3" /> + <edge from-layer="4979" from-port="4" to-layer="4985" to-port="1" /> + <edge from-layer="4980" from-port="0" to-layer="4983" to-port="0" /> + <edge from-layer="4981" from-port="0" to-layer="4982" to-port="1" /> + <edge from-layer="4982" from-port="2" to-layer="4990" to-port="2" /> + <edge from-layer="4982" from-port="2" to-layer="4983" to-port="2" /> + <edge from-layer="4983" from-port="4" to-layer="4985" to-port="2" /> + <edge from-layer="4984" from-port="0" to-layer="4985" to-port="3" /> + <edge from-layer="4985" from-port="4" to-layer="4992" to-port="0" /> + <edge from-layer="4986" from-port="0" to-layer="4992" to-port="1" /> + <edge from-layer="4987" from-port="0" to-layer="4990" to-port="0" /> + <edge from-layer="4988" from-port="0" to-layer="4990" to-port="1" /> + <edge from-layer="4989" from-port="0" to-layer="4990" to-port="3" /> + <edge from-layer="4990" from-port="4" to-layer="4992" to-port="2" /> + <edge from-layer="4991" from-port="0" to-layer="4992" to-port="3" /> + <edge from-layer="4992" from-port="4" to-layer="4995" to-port="0" /> + <edge from-layer="4993" from-port="0" to-layer="4995" to-port="1" /> + <edge from-layer="4994" from-port="0" to-layer="4995" to-port="2" /> + <edge from-layer="4995" from-port="3" to-layer="4996" to-port="0" /> + <edge from-layer="4996" from-port="2" to-layer="5006" to-port="0" /> + <edge from-layer="4996" from-port="2" to-layer="4997" to-port="0" /> + <edge from-layer="4997" from-port="1" to-layer="5005" to-port="0" /> + <edge from-layer="4998" from-port="0" to-layer="5000" to-port="1" /> + <edge from-layer="4999" from-port="0" to-layer="5000" to-port="2" /> + <edge from-layer="5000" from-port="3" to-layer="5004" to-port="0" /> + <edge from-layer="5001" from-port="0" to-layer="5004" to-port="1" /> + <edge from-layer="5002" from-port="0" to-layer="5004" to-port="2" /> + <edge from-layer="5003" from-port="0" to-layer="5004" to-port="3" /> + <edge from-layer="5004" from-port="4" to-layer="5005" to-port="1" /> + <edge from-layer="5005" from-port="2" to-layer="5006" to-port="1" /> + <edge from-layer="5006" from-port="2" to-layer="5007" to-port="3" /> + <edge from-layer="5007" from-port="4" to-layer="5009" to-port="0" /> + <edge from-layer="5008" from-port="0" to-layer="5009" to-port="1" /> + <edge from-layer="5009" from-port="2" to-layer="5011" to-port="0" /> + <edge from-layer="5010" from-port="0" to-layer="5011" to-port="1" /> + <edge from-layer="5011" from-port="2" to-layer="5020" to-port="0" /> + <edge from-layer="5012" from-port="0" to-layer="5013" to-port="0" /> + <edge from-layer="5013" from-port="1" to-layer="5016" to-port="0" /> + <edge from-layer="5014" from-port="0" to-layer="5015" to-port="0" /> + <edge from-layer="5015" from-port="1" to-layer="5016" to-port="1" /> + <edge from-layer="5016" from-port="2" to-layer="5018" to-port="0" /> + <edge from-layer="5017" from-port="0" to-layer="5018" to-port="1" /> + <edge from-layer="5018" from-port="2" to-layer="5019" to-port="0" /> + <edge from-layer="5019" from-port="1" to-layer="5020" to-port="1" /> + <edge from-layer="5020" from-port="2" to-layer="5022" to-port="0" /> + <edge from-layer="5021" from-port="0" to-layer="5022" to-port="1" /> + <edge from-layer="5022" from-port="2" to-layer="5023" to-port="0" /> + <edge from-layer="5023" from-port="2" to-layer="5053" to-port="1" /> + <edge from-layer="5023" from-port="2" to-layer="5025" to-port="0" /> + <edge from-layer="5024" from-port="0" to-layer="5025" to-port="1" /> + <edge from-layer="5025" from-port="2" to-layer="5027" to-port="0" /> + <edge from-layer="5026" from-port="0" to-layer="5027" to-port="1" /> + <edge from-layer="5027" from-port="2" to-layer="5029" to-port="0" /> + <edge from-layer="5028" from-port="0" to-layer="5029" to-port="1" /> + <edge from-layer="5029" from-port="2" to-layer="5038" to-port="0" /> + <edge from-layer="5030" from-port="0" to-layer="5031" to-port="0" /> + <edge from-layer="5031" from-port="1" to-layer="5034" to-port="0" /> + <edge from-layer="5032" from-port="0" to-layer="5033" to-port="0" /> + <edge from-layer="5033" from-port="1" to-layer="5034" to-port="1" /> + <edge from-layer="5034" from-port="2" to-layer="5036" to-port="0" /> + <edge from-layer="5035" from-port="0" to-layer="5036" to-port="1" /> + <edge from-layer="5036" from-port="2" to-layer="5037" to-port="0" /> + <edge from-layer="5037" from-port="1" to-layer="5038" to-port="1" /> + <edge from-layer="5038" from-port="2" to-layer="5040" to-port="0" /> + <edge from-layer="5039" from-port="0" to-layer="5040" to-port="1" /> + <edge from-layer="5040" from-port="2" to-layer="5041" to-port="0" /> + <edge from-layer="5041" from-port="1" to-layer="5050" to-port="0" /> + <edge from-layer="5042" from-port="0" to-layer="5043" to-port="0" /> + <edge from-layer="5043" from-port="1" to-layer="5046" to-port="0" /> + <edge from-layer="5044" from-port="0" to-layer="5045" to-port="0" /> + <edge from-layer="5045" from-port="1" to-layer="5046" to-port="1" /> + <edge from-layer="5046" from-port="2" to-layer="5048" to-port="0" /> + <edge from-layer="5047" from-port="0" to-layer="5048" to-port="1" /> + <edge from-layer="5048" from-port="2" to-layer="5049" to-port="0" /> + <edge from-layer="5049" from-port="1" to-layer="5050" to-port="1" /> + <edge from-layer="5050" from-port="2" to-layer="5052" to-port="0" /> + <edge from-layer="5051" from-port="0" to-layer="5052" to-port="1" /> + <edge from-layer="5052" from-port="2" to-layer="5053" to-port="0" /> + <edge from-layer="5053" from-port="2" to-layer="5250" to-port="1" /> + <edge from-layer="5053" from-port="2" to-layer="5055" to-port="0" /> + <edge from-layer="5054" from-port="0" to-layer="5055" to-port="1" /> + <edge from-layer="5055" from-port="2" to-layer="5057" to-port="0" /> + <edge from-layer="5056" from-port="0" to-layer="5057" to-port="1" /> + <edge from-layer="5057" from-port="2" to-layer="5059" to-port="0" /> + <edge from-layer="5058" from-port="0" to-layer="5059" to-port="1" /> + <edge from-layer="5059" from-port="2" to-layer="5068" to-port="0" /> + <edge from-layer="5060" from-port="0" to-layer="5061" to-port="0" /> + <edge from-layer="5061" from-port="1" to-layer="5064" to-port="0" /> + <edge from-layer="5062" from-port="0" to-layer="5063" to-port="0" /> + <edge from-layer="5063" from-port="1" to-layer="5064" to-port="1" /> + <edge from-layer="5064" from-port="2" to-layer="5066" to-port="0" /> + <edge from-layer="5065" from-port="0" to-layer="5066" to-port="1" /> + <edge from-layer="5066" from-port="2" to-layer="5067" to-port="0" /> + <edge from-layer="5067" from-port="1" to-layer="5068" to-port="1" /> + <edge from-layer="5068" from-port="2" to-layer="5070" to-port="0" /> + <edge from-layer="5069" from-port="0" to-layer="5070" to-port="1" /> + <edge from-layer="5070" from-port="2" to-layer="5072" to-port="0" /> + <edge from-layer="5071" from-port="0" to-layer="5072" to-port="1" /> + <edge from-layer="5072" from-port="2" to-layer="5076" to-port="0" /> + <edge from-layer="5072" from-port="2" to-layer="5088" to-port="0" /> + <edge from-layer="5072" from-port="2" to-layer="5186" to-port="0" /> + <edge from-layer="5073" from-port="0" to-layer="5076" to-port="1" /> + <edge from-layer="5074" from-port="0" to-layer="5076" to-port="2" /> + <edge from-layer="5075" from-port="0" to-layer="5076" to-port="3" /> + <edge from-layer="5076" from-port="4" to-layer="5078" to-port="0" /> + <edge from-layer="5077" from-port="0" to-layer="5078" to-port="1" /> + <edge from-layer="5078" from-port="2" to-layer="5082" to-port="0" /> + <edge from-layer="5079" from-port="0" to-layer="5082" to-port="1" /> + <edge from-layer="5080" from-port="0" to-layer="5082" to-port="2" /> + <edge from-layer="5081" from-port="0" to-layer="5082" to-port="3" /> + <edge from-layer="5082" from-port="4" to-layer="5114" to-port="0" /> + <edge from-layer="5082" from-port="4" to-layer="5133" to-port="0" /> + <edge from-layer="5082" from-port="4" to-layer="5128" to-port="0" /> + <edge from-layer="5082" from-port="4" to-layer="5117" to-port="0" /> + <edge from-layer="5083" from-port="0" to-layer="5110" to-port="0" /> + <edge from-layer="5084" from-port="0" to-layer="5110" to-port="1" /> + <edge from-layer="5085" from-port="0" to-layer="5088" to-port="1" /> + <edge from-layer="5086" from-port="0" to-layer="5088" to-port="2" /> + <edge from-layer="5087" from-port="0" to-layer="5088" to-port="3" /> + <edge from-layer="5088" from-port="4" to-layer="5145" to-port="0" /> + <edge from-layer="5088" from-port="4" to-layer="5089" to-port="0" /> + <edge from-layer="5089" from-port="1" to-layer="5092" to-port="0" /> + <edge from-layer="5090" from-port="0" to-layer="5092" to-port="1" /> + <edge from-layer="5091" from-port="0" to-layer="5092" to-port="2" /> + <edge from-layer="5092" from-port="3" to-layer="5108" to-port="0" /> + <edge from-layer="5093" from-port="0" to-layer="5098" to-port="0" /> + <edge from-layer="5094" from-port="0" to-layer="5097" to-port="1" /> + <edge from-layer="5095" from-port="0" to-layer="5097" to-port="2" /> + <edge from-layer="5096" from-port="0" to-layer="5097" to-port="3" /> + <edge from-layer="5097" from-port="4" to-layer="5098" to-port="1" /> + <edge from-layer="5098" from-port="2" to-layer="5099" to-port="0" /> + <edge from-layer="5099" from-port="1" to-layer="5101" to-port="0" /> + <edge from-layer="5100" from-port="0" to-layer="5101" to-port="2" /> + <edge from-layer="5101" from-port="3" to-layer="5102" to-port="0" /> + <edge from-layer="5101" from-port="3" to-layer="5173" to-port="0" /> + <edge from-layer="5102" from-port="1" to-layer="5105" to-port="0" /> + <edge from-layer="5103" from-port="0" to-layer="5105" to-port="1" /> + <edge from-layer="5104" from-port="0" to-layer="5105" to-port="2" /> + <edge from-layer="5105" from-port="3" to-layer="5107" to-port="0" /> + <edge from-layer="5105" from-port="3" to-layer="5197" to-port="0" /> + <edge from-layer="5106" from-port="0" to-layer="5107" to-port="1" /> + <edge from-layer="5107" from-port="2" to-layer="5108" to-port="1" /> + <edge from-layer="5108" from-port="2" to-layer="5110" to-port="2" /> + <edge from-layer="5108" from-port="2" to-layer="5138" to-port="2" /> + <edge from-layer="5109" from-port="0" to-layer="5110" to-port="3" /> + <edge from-layer="5110" from-port="4" to-layer="5112" to-port="0" /> + <edge from-layer="5111" from-port="0" to-layer="5112" to-port="2" /> + <edge from-layer="5112" from-port="3" to-layer="5113" to-port="0" /> + <edge from-layer="5113" from-port="2" to-layer="5114" to-port="1" /> + <edge from-layer="5113" from-port="2" to-layer="5150" to-port="1" /> + <edge from-layer="5114" from-port="2" to-layer="5143" to-port="0" /> + <edge from-layer="5115" from-port="0" to-layer="5125" to-port="0" /> + <edge from-layer="5116" from-port="0" to-layer="5125" to-port="1" /> + <edge from-layer="5117" from-port="1" to-layer="5119" to-port="0" /> + <edge from-layer="5118" from-port="0" to-layer="5119" to-port="2" /> + <edge from-layer="5119" from-port="3" to-layer="5120" to-port="0" /> + <edge from-layer="5120" from-port="2" to-layer="5121" to-port="0" /> + <edge from-layer="5121" from-port="1" to-layer="5123" to-port="0" /> + <edge from-layer="5122" from-port="0" to-layer="5123" to-port="1" /> + <edge from-layer="5123" from-port="2" to-layer="5125" to-port="2" /> + <edge from-layer="5124" from-port="0" to-layer="5125" to-port="3" /> + <edge from-layer="5125" from-port="4" to-layer="5128" to-port="1" /> + <edge from-layer="5125" from-port="4" to-layer="5133" to-port="2" /> + <edge from-layer="5126" from-port="0" to-layer="5128" to-port="2" /> + <edge from-layer="5127" from-port="0" to-layer="5128" to-port="3" /> + <edge from-layer="5128" from-port="4" to-layer="5130" to-port="0" /> + <edge from-layer="5129" from-port="0" to-layer="5130" to-port="1" /> + <edge from-layer="5130" from-port="2" to-layer="5134" to-port="0" /> + <edge from-layer="5131" from-port="0" to-layer="5133" to-port="1" /> + <edge from-layer="5132" from-port="0" to-layer="5133" to-port="3" /> + <edge from-layer="5133" from-port="4" to-layer="5134" to-port="1" /> + <edge from-layer="5134" from-port="2" to-layer="5142" to-port="0" /> + <edge from-layer="5135" from-port="0" to-layer="5138" to-port="0" /> + <edge from-layer="5136" from-port="0" to-layer="5138" to-port="1" /> + <edge from-layer="5137" from-port="0" to-layer="5138" to-port="3" /> + <edge from-layer="5138" from-port="4" to-layer="5140" to-port="0" /> + <edge from-layer="5139" from-port="0" to-layer="5140" to-port="2" /> + <edge from-layer="5140" from-port="3" to-layer="5141" to-port="0" /> + <edge from-layer="5141" from-port="2" to-layer="5142" to-port="1" /> + <edge from-layer="5141" from-port="2" to-layer="5171" to-port="1" /> + <edge from-layer="5142" from-port="2" to-layer="5143" to-port="1" /> + <edge from-layer="5143" from-port="2" to-layer="5234" to-port="0" /> + <edge from-layer="5143" from-port="2" to-layer="5198" to-port="0" /> + <edge from-layer="5144" from-port="0" to-layer="5145" to-port="1" /> + <edge from-layer="5145" from-port="2" to-layer="5149" to-port="0" /> + <edge from-layer="5146" from-port="0" to-layer="5149" to-port="1" /> + <edge from-layer="5147" from-port="0" to-layer="5149" to-port="2" /> + <edge from-layer="5148" from-port="0" to-layer="5149" to-port="3" /> + <edge from-layer="5149" from-port="4" to-layer="5169" to-port="0" /> + <edge from-layer="5149" from-port="4" to-layer="5150" to-port="0" /> + <edge from-layer="5149" from-port="4" to-layer="5153" to-port="0" /> + <edge from-layer="5149" from-port="4" to-layer="5164" to-port="0" /> + <edge from-layer="5150" from-port="2" to-layer="5172" to-port="0" /> + <edge from-layer="5151" from-port="0" to-layer="5161" to-port="0" /> + <edge from-layer="5152" from-port="0" to-layer="5161" to-port="1" /> + <edge from-layer="5153" from-port="1" to-layer="5155" to-port="0" /> + <edge from-layer="5154" from-port="0" to-layer="5155" to-port="2" /> + <edge from-layer="5155" from-port="3" to-layer="5156" to-port="0" /> + <edge from-layer="5156" from-port="2" to-layer="5157" to-port="0" /> + <edge from-layer="5157" from-port="1" to-layer="5159" to-port="0" /> + <edge from-layer="5158" from-port="0" to-layer="5159" to-port="1" /> + <edge from-layer="5159" from-port="2" to-layer="5161" to-port="2" /> + <edge from-layer="5160" from-port="0" to-layer="5161" to-port="3" /> + <edge from-layer="5161" from-port="4" to-layer="5164" to-port="1" /> + <edge from-layer="5161" from-port="4" to-layer="5169" to-port="2" /> + <edge from-layer="5162" from-port="0" to-layer="5164" to-port="2" /> + <edge from-layer="5163" from-port="0" to-layer="5164" to-port="3" /> + <edge from-layer="5164" from-port="4" to-layer="5166" to-port="0" /> + <edge from-layer="5165" from-port="0" to-layer="5166" to-port="1" /> + <edge from-layer="5166" from-port="2" to-layer="5170" to-port="0" /> + <edge from-layer="5167" from-port="0" to-layer="5169" to-port="1" /> + <edge from-layer="5168" from-port="0" to-layer="5169" to-port="3" /> + <edge from-layer="5169" from-port="4" to-layer="5170" to-port="1" /> + <edge from-layer="5170" from-port="2" to-layer="5171" to-port="0" /> + <edge from-layer="5171" from-port="2" to-layer="5172" to-port="1" /> + <edge from-layer="5172" from-port="2" to-layer="5193" to-port="0" /> + <edge from-layer="5172" from-port="2" to-layer="5173" to-port="1" /> + <edge from-layer="5173" from-port="2" to-layer="5234" to-port="1" /> + <edge from-layer="5173" from-port="2" to-layer="7210" to-port="0" /> + <edge from-layer="5174" from-port="0" to-layer="5179" to-port="0" /> + <edge from-layer="5175" from-port="0" to-layer="5178" to-port="1" /> + <edge from-layer="5176" from-port="0" to-layer="5178" to-port="2" /> + <edge from-layer="5177" from-port="0" to-layer="5178" to-port="3" /> + <edge from-layer="5178" from-port="4" to-layer="5179" to-port="1" /> + <edge from-layer="5179" from-port="2" to-layer="5180" to-port="0" /> + <edge from-layer="5180" from-port="1" to-layer="5182" to-port="0" /> + <edge from-layer="5181" from-port="0" to-layer="5182" to-port="2" /> + <edge from-layer="5182" from-port="3" to-layer="5189" to-port="0" /> + <edge from-layer="5183" from-port="0" to-layer="5186" to-port="1" /> + <edge from-layer="5184" from-port="0" to-layer="5186" to-port="2" /> + <edge from-layer="5185" from-port="0" to-layer="5186" to-port="3" /> + <edge from-layer="5186" from-port="4" to-layer="5188" to-port="0" /> + <edge from-layer="5187" from-port="0" to-layer="5188" to-port="1" /> + <edge from-layer="5188" from-port="2" to-layer="5189" to-port="1" /> + <edge from-layer="5189" from-port="2" to-layer="7209" to-port="0" /> + <edge from-layer="5189" from-port="2" to-layer="5234" to-port="2" /> + <edge from-layer="5190" from-port="0" to-layer="5212" to-port="0" /> + <edge from-layer="5191" from-port="0" to-layer="5206" to-port="0" /> + <edge from-layer="5192" from-port="0" to-layer="5210" to-port="1" /> + <edge from-layer="5192" from-port="0" to-layer="5206" to-port="1" /> + <edge from-layer="5193" from-port="1" to-layer="5196" to-port="0" /> + <edge from-layer="5194" from-port="0" to-layer="5196" to-port="1" /> + <edge from-layer="5195" from-port="0" to-layer="5196" to-port="2" /> + <edge from-layer="5196" from-port="3" to-layer="5197" to-port="1" /> + <edge from-layer="5197" from-port="2" to-layer="5209" to-port="0" /> + <edge from-layer="5197" from-port="2" to-layer="5202" to-port="0" /> + <edge from-layer="5198" from-port="1" to-layer="5201" to-port="0" /> + <edge from-layer="5198" from-port="1" to-layer="5227" to-port="0" /> + <edge from-layer="5199" from-port="0" to-layer="5201" to-port="1" /> + <edge from-layer="5200" from-port="0" to-layer="5201" to-port="2" /> + <edge from-layer="5201" from-port="3" to-layer="5202" to-port="1" /> + <edge from-layer="5202" from-port="2" to-layer="5204" to-port="0" /> + <edge from-layer="5203" from-port="0" to-layer="5204" to-port="1" /> + <edge from-layer="5204" from-port="2" to-layer="5206" to-port="2" /> + <edge from-layer="5205" from-port="0" to-layer="5210" to-port="3" /> + <edge from-layer="5205" from-port="0" to-layer="5206" to-port="3" /> + <edge from-layer="5206" from-port="4" to-layer="5212" to-port="1" /> + <edge from-layer="5207" from-port="0" to-layer="5210" to-port="0" /> + <edge from-layer="5208" from-port="0" to-layer="5209" to-port="1" /> + <edge from-layer="5209" from-port="2" to-layer="5217" to-port="2" /> + <edge from-layer="5209" from-port="2" to-layer="5210" to-port="2" /> + <edge from-layer="5210" from-port="4" to-layer="5212" to-port="2" /> + <edge from-layer="5211" from-port="0" to-layer="5212" to-port="3" /> + <edge from-layer="5212" from-port="4" to-layer="5219" to-port="0" /> + <edge from-layer="5213" from-port="0" to-layer="5219" to-port="1" /> + <edge from-layer="5214" from-port="0" to-layer="5217" to-port="0" /> + <edge from-layer="5215" from-port="0" to-layer="5217" to-port="1" /> + <edge from-layer="5216" from-port="0" to-layer="5217" to-port="3" /> + <edge from-layer="5217" from-port="4" to-layer="5219" to-port="2" /> + <edge from-layer="5218" from-port="0" to-layer="5219" to-port="3" /> + <edge from-layer="5219" from-port="4" to-layer="5222" to-port="0" /> + <edge from-layer="5220" from-port="0" to-layer="5222" to-port="1" /> + <edge from-layer="5221" from-port="0" to-layer="5222" to-port="2" /> + <edge from-layer="5222" from-port="3" to-layer="5223" to-port="0" /> + <edge from-layer="5223" from-port="2" to-layer="5224" to-port="0" /> + <edge from-layer="5223" from-port="2" to-layer="5233" to-port="0" /> + <edge from-layer="5224" from-port="1" to-layer="5232" to-port="0" /> + <edge from-layer="5225" from-port="0" to-layer="5227" to-port="1" /> + <edge from-layer="5226" from-port="0" to-layer="5227" to-port="2" /> + <edge from-layer="5227" from-port="3" to-layer="5231" to-port="0" /> + <edge from-layer="5228" from-port="0" to-layer="5231" to-port="1" /> + <edge from-layer="5229" from-port="0" to-layer="5231" to-port="2" /> + <edge from-layer="5230" from-port="0" to-layer="5231" to-port="3" /> + <edge from-layer="5231" from-port="4" to-layer="5232" to-port="1" /> + <edge from-layer="5232" from-port="2" to-layer="5233" to-port="1" /> + <edge from-layer="5233" from-port="2" to-layer="5234" to-port="3" /> + <edge from-layer="5234" from-port="4" to-layer="5236" to-port="0" /> + <edge from-layer="5235" from-port="0" to-layer="5236" to-port="1" /> + <edge from-layer="5236" from-port="2" to-layer="5238" to-port="0" /> + <edge from-layer="5237" from-port="0" to-layer="5238" to-port="1" /> + <edge from-layer="5238" from-port="2" to-layer="5247" to-port="0" /> + <edge from-layer="5239" from-port="0" to-layer="5240" to-port="0" /> + <edge from-layer="5240" from-port="1" to-layer="5243" to-port="0" /> + <edge from-layer="5241" from-port="0" to-layer="5242" to-port="0" /> + <edge from-layer="5242" from-port="1" to-layer="5243" to-port="1" /> + <edge from-layer="5243" from-port="2" to-layer="5245" to-port="0" /> + <edge from-layer="5244" from-port="0" to-layer="5245" to-port="1" /> + <edge from-layer="5245" from-port="2" to-layer="5246" to-port="0" /> + <edge from-layer="5246" from-port="1" to-layer="5247" to-port="1" /> + <edge from-layer="5247" from-port="2" to-layer="5249" to-port="0" /> + <edge from-layer="5248" from-port="0" to-layer="5249" to-port="1" /> + <edge from-layer="5249" from-port="2" to-layer="5250" to-port="0" /> + <edge from-layer="5250" from-port="2" to-layer="5252" to-port="0" /> + <edge from-layer="5250" from-port="2" to-layer="5280" to-port="1" /> + <edge from-layer="5251" from-port="0" to-layer="5252" to-port="1" /> + <edge from-layer="5252" from-port="2" to-layer="5254" to-port="0" /> + <edge from-layer="5253" from-port="0" to-layer="5254" to-port="1" /> + <edge from-layer="5254" from-port="2" to-layer="5256" to-port="0" /> + <edge from-layer="5255" from-port="0" to-layer="5256" to-port="1" /> + <edge from-layer="5256" from-port="2" to-layer="5265" to-port="0" /> + <edge from-layer="5257" from-port="0" to-layer="5258" to-port="0" /> + <edge from-layer="5258" from-port="1" to-layer="5261" to-port="0" /> + <edge from-layer="5259" from-port="0" to-layer="5260" to-port="0" /> + <edge from-layer="5260" from-port="1" to-layer="5261" to-port="1" /> + <edge from-layer="5261" from-port="2" to-layer="5263" to-port="0" /> + <edge from-layer="5262" from-port="0" to-layer="5263" to-port="1" /> + <edge from-layer="5263" from-port="2" to-layer="5264" to-port="0" /> + <edge from-layer="5264" from-port="1" to-layer="5265" to-port="1" /> + <edge from-layer="5265" from-port="2" to-layer="5267" to-port="0" /> + <edge from-layer="5266" from-port="0" to-layer="5267" to-port="1" /> + <edge from-layer="5267" from-port="2" to-layer="5268" to-port="0" /> + <edge from-layer="5268" from-port="1" to-layer="5277" to-port="0" /> + <edge from-layer="5269" from-port="0" to-layer="5270" to-port="0" /> + <edge from-layer="5270" from-port="1" to-layer="5273" to-port="0" /> + <edge from-layer="5271" from-port="0" to-layer="5272" to-port="0" /> + <edge from-layer="5272" from-port="1" to-layer="5273" to-port="1" /> + <edge from-layer="5273" from-port="2" to-layer="5275" to-port="0" /> + <edge from-layer="5274" from-port="0" to-layer="5275" to-port="1" /> + <edge from-layer="5275" from-port="2" to-layer="5276" to-port="0" /> + <edge from-layer="5276" from-port="1" to-layer="5277" to-port="1" /> + <edge from-layer="5277" from-port="2" to-layer="5279" to-port="0" /> + <edge from-layer="5278" from-port="0" to-layer="5279" to-port="1" /> + <edge from-layer="5279" from-port="2" to-layer="5280" to-port="0" /> + <edge from-layer="5280" from-port="2" to-layer="5477" to-port="1" /> + <edge from-layer="5280" from-port="2" to-layer="5282" to-port="0" /> + <edge from-layer="5281" from-port="0" to-layer="5282" to-port="1" /> + <edge from-layer="5282" from-port="2" to-layer="5284" to-port="0" /> + <edge from-layer="5283" from-port="0" to-layer="5284" to-port="1" /> + <edge from-layer="5284" from-port="2" to-layer="5286" to-port="0" /> + <edge from-layer="5285" from-port="0" to-layer="5286" to-port="1" /> + <edge from-layer="5286" from-port="2" to-layer="5295" to-port="0" /> + <edge from-layer="5287" from-port="0" to-layer="5288" to-port="0" /> + <edge from-layer="5288" from-port="1" to-layer="5291" to-port="0" /> + <edge from-layer="5289" from-port="0" to-layer="5290" to-port="0" /> + <edge from-layer="5290" from-port="1" to-layer="5291" to-port="1" /> + <edge from-layer="5291" from-port="2" to-layer="5293" to-port="0" /> + <edge from-layer="5292" from-port="0" to-layer="5293" to-port="1" /> + <edge from-layer="5293" from-port="2" to-layer="5294" to-port="0" /> + <edge from-layer="5294" from-port="1" to-layer="5295" to-port="1" /> + <edge from-layer="5295" from-port="2" to-layer="5297" to-port="0" /> + <edge from-layer="5296" from-port="0" to-layer="5297" to-port="1" /> + <edge from-layer="5297" from-port="2" to-layer="5299" to-port="0" /> + <edge from-layer="5298" from-port="0" to-layer="5299" to-port="1" /> + <edge from-layer="5299" from-port="2" to-layer="5303" to-port="0" /> + <edge from-layer="5299" from-port="2" to-layer="5413" to-port="0" /> + <edge from-layer="5299" from-port="2" to-layer="5315" to-port="0" /> + <edge from-layer="5300" from-port="0" to-layer="5303" to-port="1" /> + <edge from-layer="5301" from-port="0" to-layer="5303" to-port="2" /> + <edge from-layer="5302" from-port="0" to-layer="5303" to-port="3" /> + <edge from-layer="5303" from-port="4" to-layer="5305" to-port="0" /> + <edge from-layer="5304" from-port="0" to-layer="5305" to-port="1" /> + <edge from-layer="5305" from-port="2" to-layer="5309" to-port="0" /> + <edge from-layer="5306" from-port="0" to-layer="5309" to-port="1" /> + <edge from-layer="5307" from-port="0" to-layer="5309" to-port="2" /> + <edge from-layer="5308" from-port="0" to-layer="5309" to-port="3" /> + <edge from-layer="5309" from-port="4" to-layer="5355" to-port="0" /> + <edge from-layer="5309" from-port="4" to-layer="5341" to-port="0" /> + <edge from-layer="5309" from-port="4" to-layer="5344" to-port="0" /> + <edge from-layer="5309" from-port="4" to-layer="5360" to-port="0" /> + <edge from-layer="5310" from-port="0" to-layer="5337" to-port="0" /> + <edge from-layer="5311" from-port="0" to-layer="5337" to-port="1" /> + <edge from-layer="5312" from-port="0" to-layer="5315" to-port="1" /> + <edge from-layer="5313" from-port="0" to-layer="5315" to-port="2" /> + <edge from-layer="5314" from-port="0" to-layer="5315" to-port="3" /> + <edge from-layer="5315" from-port="4" to-layer="5316" to-port="0" /> + <edge from-layer="5315" from-port="4" to-layer="5372" to-port="0" /> + <edge from-layer="5316" from-port="1" to-layer="5319" to-port="0" /> + <edge from-layer="5317" from-port="0" to-layer="5319" to-port="1" /> + <edge from-layer="5318" from-port="0" to-layer="5319" to-port="2" /> + <edge from-layer="5319" from-port="3" to-layer="5335" to-port="0" /> + <edge from-layer="5320" from-port="0" to-layer="5325" to-port="0" /> + <edge from-layer="5321" from-port="0" to-layer="5324" to-port="1" /> + <edge from-layer="5322" from-port="0" to-layer="5324" to-port="2" /> + <edge from-layer="5323" from-port="0" to-layer="5324" to-port="3" /> + <edge from-layer="5324" from-port="4" to-layer="5325" to-port="1" /> + <edge from-layer="5325" from-port="2" to-layer="5326" to-port="0" /> + <edge from-layer="5326" from-port="1" to-layer="5328" to-port="0" /> + <edge from-layer="5327" from-port="0" to-layer="5328" to-port="2" /> + <edge from-layer="5328" from-port="3" to-layer="5400" to-port="0" /> + <edge from-layer="5328" from-port="3" to-layer="5329" to-port="0" /> + <edge from-layer="5329" from-port="1" to-layer="5332" to-port="0" /> + <edge from-layer="5330" from-port="0" to-layer="5332" to-port="1" /> + <edge from-layer="5331" from-port="0" to-layer="5332" to-port="2" /> + <edge from-layer="5332" from-port="3" to-layer="5334" to-port="0" /> + <edge from-layer="5332" from-port="3" to-layer="5424" to-port="0" /> + <edge from-layer="5333" from-port="0" to-layer="5334" to-port="1" /> + <edge from-layer="5334" from-port="2" to-layer="5335" to-port="1" /> + <edge from-layer="5335" from-port="2" to-layer="5365" to-port="2" /> + <edge from-layer="5335" from-port="2" to-layer="5337" to-port="2" /> + <edge from-layer="5336" from-port="0" to-layer="5337" to-port="3" /> + <edge from-layer="5337" from-port="4" to-layer="5339" to-port="0" /> + <edge from-layer="5338" from-port="0" to-layer="5339" to-port="2" /> + <edge from-layer="5339" from-port="3" to-layer="5340" to-port="0" /> + <edge from-layer="5340" from-port="2" to-layer="5341" to-port="1" /> + <edge from-layer="5340" from-port="2" to-layer="5377" to-port="1" /> + <edge from-layer="5341" from-port="2" to-layer="5370" to-port="0" /> + <edge from-layer="5342" from-port="0" to-layer="5352" to-port="0" /> + <edge from-layer="5343" from-port="0" to-layer="5352" to-port="1" /> + <edge from-layer="5344" from-port="1" to-layer="5346" to-port="0" /> + <edge from-layer="5345" from-port="0" to-layer="5346" to-port="2" /> + <edge from-layer="5346" from-port="3" to-layer="5347" to-port="0" /> + <edge from-layer="5347" from-port="2" to-layer="5348" to-port="0" /> + <edge from-layer="5348" from-port="1" to-layer="5350" to-port="0" /> + <edge from-layer="5349" from-port="0" to-layer="5350" to-port="1" /> + <edge from-layer="5350" from-port="2" to-layer="5352" to-port="2" /> + <edge from-layer="5351" from-port="0" to-layer="5352" to-port="3" /> + <edge from-layer="5352" from-port="4" to-layer="5355" to-port="1" /> + <edge from-layer="5352" from-port="4" to-layer="5360" to-port="2" /> + <edge from-layer="5353" from-port="0" to-layer="5355" to-port="2" /> + <edge from-layer="5354" from-port="0" to-layer="5355" to-port="3" /> + <edge from-layer="5355" from-port="4" to-layer="5357" to-port="0" /> + <edge from-layer="5356" from-port="0" to-layer="5357" to-port="1" /> + <edge from-layer="5357" from-port="2" to-layer="5361" to-port="0" /> + <edge from-layer="5358" from-port="0" to-layer="5360" to-port="1" /> + <edge from-layer="5359" from-port="0" to-layer="5360" to-port="3" /> + <edge from-layer="5360" from-port="4" to-layer="5361" to-port="1" /> + <edge from-layer="5361" from-port="2" to-layer="5369" to-port="0" /> + <edge from-layer="5362" from-port="0" to-layer="5365" to-port="0" /> + <edge from-layer="5363" from-port="0" to-layer="5365" to-port="1" /> + <edge from-layer="5364" from-port="0" to-layer="5365" to-port="3" /> + <edge from-layer="5365" from-port="4" to-layer="5367" to-port="0" /> + <edge from-layer="5366" from-port="0" to-layer="5367" to-port="2" /> + <edge from-layer="5367" from-port="3" to-layer="5368" to-port="0" /> + <edge from-layer="5368" from-port="2" to-layer="5369" to-port="1" /> + <edge from-layer="5368" from-port="2" to-layer="5398" to-port="1" /> + <edge from-layer="5369" from-port="2" to-layer="5370" to-port="1" /> + <edge from-layer="5370" from-port="2" to-layer="5461" to-port="0" /> + <edge from-layer="5370" from-port="2" to-layer="5425" to-port="0" /> + <edge from-layer="5371" from-port="0" to-layer="5372" to-port="1" /> + <edge from-layer="5372" from-port="2" to-layer="5376" to-port="0" /> + <edge from-layer="5373" from-port="0" to-layer="5376" to-port="1" /> + <edge from-layer="5374" from-port="0" to-layer="5376" to-port="2" /> + <edge from-layer="5375" from-port="0" to-layer="5376" to-port="3" /> + <edge from-layer="5376" from-port="4" to-layer="5380" to-port="0" /> + <edge from-layer="5376" from-port="4" to-layer="5377" to-port="0" /> + <edge from-layer="5376" from-port="4" to-layer="5396" to-port="0" /> + <edge from-layer="5376" from-port="4" to-layer="5391" to-port="0" /> + <edge from-layer="5377" from-port="2" to-layer="5399" to-port="0" /> + <edge from-layer="5378" from-port="0" to-layer="5388" to-port="0" /> + <edge from-layer="5379" from-port="0" to-layer="5388" to-port="1" /> + <edge from-layer="5380" from-port="1" to-layer="5382" to-port="0" /> + <edge from-layer="5381" from-port="0" to-layer="5382" to-port="2" /> + <edge from-layer="5382" from-port="3" to-layer="5383" to-port="0" /> + <edge from-layer="5383" from-port="2" to-layer="5384" to-port="0" /> + <edge from-layer="5384" from-port="1" to-layer="5386" to-port="0" /> + <edge from-layer="5385" from-port="0" to-layer="5386" to-port="1" /> + <edge from-layer="5386" from-port="2" to-layer="5388" to-port="2" /> + <edge from-layer="5387" from-port="0" to-layer="5388" to-port="3" /> + <edge from-layer="5388" from-port="4" to-layer="5391" to-port="1" /> + <edge from-layer="5388" from-port="4" to-layer="5396" to-port="2" /> + <edge from-layer="5389" from-port="0" to-layer="5391" to-port="2" /> + <edge from-layer="5390" from-port="0" to-layer="5391" to-port="3" /> + <edge from-layer="5391" from-port="4" to-layer="5393" to-port="0" /> + <edge from-layer="5392" from-port="0" to-layer="5393" to-port="1" /> + <edge from-layer="5393" from-port="2" to-layer="5397" to-port="0" /> + <edge from-layer="5394" from-port="0" to-layer="5396" to-port="1" /> + <edge from-layer="5395" from-port="0" to-layer="5396" to-port="3" /> + <edge from-layer="5396" from-port="4" to-layer="5397" to-port="1" /> + <edge from-layer="5397" from-port="2" to-layer="5398" to-port="0" /> + <edge from-layer="5398" from-port="2" to-layer="5399" to-port="1" /> + <edge from-layer="5399" from-port="2" to-layer="5400" to-port="1" /> + <edge from-layer="5399" from-port="2" to-layer="5420" to-port="0" /> + <edge from-layer="5400" from-port="2" to-layer="5461" to-port="1" /> + <edge from-layer="5400" from-port="2" to-layer="7208" to-port="0" /> + <edge from-layer="5401" from-port="0" to-layer="5406" to-port="0" /> + <edge from-layer="5402" from-port="0" to-layer="5405" to-port="1" /> + <edge from-layer="5403" from-port="0" to-layer="5405" to-port="2" /> + <edge from-layer="5404" from-port="0" to-layer="5405" to-port="3" /> + <edge from-layer="5405" from-port="4" to-layer="5406" to-port="1" /> + <edge from-layer="5406" from-port="2" to-layer="5407" to-port="0" /> + <edge from-layer="5407" from-port="1" to-layer="5409" to-port="0" /> + <edge from-layer="5408" from-port="0" to-layer="5409" to-port="2" /> + <edge from-layer="5409" from-port="3" to-layer="5416" to-port="0" /> + <edge from-layer="5410" from-port="0" to-layer="5413" to-port="1" /> + <edge from-layer="5411" from-port="0" to-layer="5413" to-port="2" /> + <edge from-layer="5412" from-port="0" to-layer="5413" to-port="3" /> + <edge from-layer="5413" from-port="4" to-layer="5415" to-port="0" /> + <edge from-layer="5414" from-port="0" to-layer="5415" to-port="1" /> + <edge from-layer="5415" from-port="2" to-layer="5416" to-port="1" /> + <edge from-layer="5416" from-port="2" to-layer="5461" to-port="2" /> + <edge from-layer="5416" from-port="2" to-layer="7207" to-port="0" /> + <edge from-layer="5417" from-port="0" to-layer="5439" to-port="0" /> + <edge from-layer="5418" from-port="0" to-layer="5433" to-port="0" /> + <edge from-layer="5419" from-port="0" to-layer="5437" to-port="1" /> + <edge from-layer="5419" from-port="0" to-layer="5433" to-port="1" /> + <edge from-layer="5420" from-port="1" to-layer="5423" to-port="0" /> + <edge from-layer="5421" from-port="0" to-layer="5423" to-port="1" /> + <edge from-layer="5422" from-port="0" to-layer="5423" to-port="2" /> + <edge from-layer="5423" from-port="3" to-layer="5424" to-port="1" /> + <edge from-layer="5424" from-port="2" to-layer="5429" to-port="0" /> + <edge from-layer="5424" from-port="2" to-layer="5436" to-port="0" /> + <edge from-layer="5425" from-port="1" to-layer="5428" to-port="0" /> + <edge from-layer="5425" from-port="1" to-layer="5454" to-port="0" /> + <edge from-layer="5426" from-port="0" to-layer="5428" to-port="1" /> + <edge from-layer="5427" from-port="0" to-layer="5428" to-port="2" /> + <edge from-layer="5428" from-port="3" to-layer="5429" to-port="1" /> + <edge from-layer="5429" from-port="2" to-layer="5431" to-port="0" /> + <edge from-layer="5430" from-port="0" to-layer="5431" to-port="1" /> + <edge from-layer="5431" from-port="2" to-layer="5433" to-port="2" /> + <edge from-layer="5432" from-port="0" to-layer="5437" to-port="3" /> + <edge from-layer="5432" from-port="0" to-layer="5433" to-port="3" /> + <edge from-layer="5433" from-port="4" to-layer="5439" to-port="1" /> + <edge from-layer="5434" from-port="0" to-layer="5437" to-port="0" /> + <edge from-layer="5435" from-port="0" to-layer="5436" to-port="1" /> + <edge from-layer="5436" from-port="2" to-layer="5437" to-port="2" /> + <edge from-layer="5436" from-port="2" to-layer="5444" to-port="2" /> + <edge from-layer="5437" from-port="4" to-layer="5439" to-port="2" /> + <edge from-layer="5438" from-port="0" to-layer="5439" to-port="3" /> + <edge from-layer="5439" from-port="4" to-layer="5446" to-port="0" /> + <edge from-layer="5440" from-port="0" to-layer="5446" to-port="1" /> + <edge from-layer="5441" from-port="0" to-layer="5444" to-port="0" /> + <edge from-layer="5442" from-port="0" to-layer="5444" to-port="1" /> + <edge from-layer="5443" from-port="0" to-layer="5444" to-port="3" /> + <edge from-layer="5444" from-port="4" to-layer="5446" to-port="2" /> + <edge from-layer="5445" from-port="0" to-layer="5446" to-port="3" /> + <edge from-layer="5446" from-port="4" to-layer="5449" to-port="0" /> + <edge from-layer="5447" from-port="0" to-layer="5449" to-port="1" /> + <edge from-layer="5448" from-port="0" to-layer="5449" to-port="2" /> + <edge from-layer="5449" from-port="3" to-layer="5450" to-port="0" /> + <edge from-layer="5450" from-port="2" to-layer="5460" to-port="0" /> + <edge from-layer="5450" from-port="2" to-layer="5451" to-port="0" /> + <edge from-layer="5451" from-port="1" to-layer="5459" to-port="0" /> + <edge from-layer="5452" from-port="0" to-layer="5454" to-port="1" /> + <edge from-layer="5453" from-port="0" to-layer="5454" to-port="2" /> + <edge from-layer="5454" from-port="3" to-layer="5458" to-port="0" /> + <edge from-layer="5455" from-port="0" to-layer="5458" to-port="1" /> + <edge from-layer="5456" from-port="0" to-layer="5458" to-port="2" /> + <edge from-layer="5457" from-port="0" to-layer="5458" to-port="3" /> + <edge from-layer="5458" from-port="4" to-layer="5459" to-port="1" /> + <edge from-layer="5459" from-port="2" to-layer="5460" to-port="1" /> + <edge from-layer="5460" from-port="2" to-layer="5461" to-port="3" /> + <edge from-layer="5461" from-port="4" to-layer="5463" to-port="0" /> + <edge from-layer="5462" from-port="0" to-layer="5463" to-port="1" /> + <edge from-layer="5463" from-port="2" to-layer="5465" to-port="0" /> + <edge from-layer="5464" from-port="0" to-layer="5465" to-port="1" /> + <edge from-layer="5465" from-port="2" to-layer="5474" to-port="0" /> + <edge from-layer="5466" from-port="0" to-layer="5467" to-port="0" /> + <edge from-layer="5467" from-port="1" to-layer="5470" to-port="0" /> + <edge from-layer="5468" from-port="0" to-layer="5469" to-port="0" /> + <edge from-layer="5469" from-port="1" to-layer="5470" to-port="1" /> + <edge from-layer="5470" from-port="2" to-layer="5472" to-port="0" /> + <edge from-layer="5471" from-port="0" to-layer="5472" to-port="1" /> + <edge from-layer="5472" from-port="2" to-layer="5473" to-port="0" /> + <edge from-layer="5473" from-port="1" to-layer="5474" to-port="1" /> + <edge from-layer="5474" from-port="2" to-layer="5476" to-port="0" /> + <edge from-layer="5475" from-port="0" to-layer="5476" to-port="1" /> + <edge from-layer="5476" from-port="2" to-layer="5477" to-port="0" /> + <edge from-layer="5477" from-port="2" to-layer="5479" to-port="0" /> + <edge from-layer="5477" from-port="2" to-layer="5507" to-port="1" /> + <edge from-layer="5478" from-port="0" to-layer="5479" to-port="1" /> + <edge from-layer="5479" from-port="2" to-layer="5481" to-port="0" /> + <edge from-layer="5480" from-port="0" to-layer="5481" to-port="1" /> + <edge from-layer="5481" from-port="2" to-layer="5483" to-port="0" /> + <edge from-layer="5482" from-port="0" to-layer="5483" to-port="1" /> + <edge from-layer="5483" from-port="2" to-layer="5492" to-port="0" /> + <edge from-layer="5484" from-port="0" to-layer="5485" to-port="0" /> + <edge from-layer="5485" from-port="1" to-layer="5488" to-port="0" /> + <edge from-layer="5486" from-port="0" to-layer="5487" to-port="0" /> + <edge from-layer="5487" from-port="1" to-layer="5488" to-port="1" /> + <edge from-layer="5488" from-port="2" to-layer="5490" to-port="0" /> + <edge from-layer="5489" from-port="0" to-layer="5490" to-port="1" /> + <edge from-layer="5490" from-port="2" to-layer="5491" to-port="0" /> + <edge from-layer="5491" from-port="1" to-layer="5492" to-port="1" /> + <edge from-layer="5492" from-port="2" to-layer="5494" to-port="0" /> + <edge from-layer="5493" from-port="0" to-layer="5494" to-port="1" /> + <edge from-layer="5494" from-port="2" to-layer="5495" to-port="0" /> + <edge from-layer="5495" from-port="1" to-layer="5504" to-port="0" /> + <edge from-layer="5496" from-port="0" to-layer="5497" to-port="0" /> + <edge from-layer="5497" from-port="1" to-layer="5500" to-port="0" /> + <edge from-layer="5498" from-port="0" to-layer="5499" to-port="0" /> + <edge from-layer="5499" from-port="1" to-layer="5500" to-port="1" /> + <edge from-layer="5500" from-port="2" to-layer="5502" to-port="0" /> + <edge from-layer="5501" from-port="0" to-layer="5502" to-port="1" /> + <edge from-layer="5502" from-port="2" to-layer="5503" to-port="0" /> + <edge from-layer="5503" from-port="1" to-layer="5504" to-port="1" /> + <edge from-layer="5504" from-port="2" to-layer="5506" to-port="0" /> + <edge from-layer="5505" from-port="0" to-layer="5506" to-port="1" /> + <edge from-layer="5506" from-port="2" to-layer="5507" to-port="0" /> + <edge from-layer="5507" from-port="2" to-layer="5704" to-port="1" /> + <edge from-layer="5507" from-port="2" to-layer="5509" to-port="0" /> + <edge from-layer="5508" from-port="0" to-layer="5509" to-port="1" /> + <edge from-layer="5509" from-port="2" to-layer="5511" to-port="0" /> + <edge from-layer="5510" from-port="0" to-layer="5511" to-port="1" /> + <edge from-layer="5511" from-port="2" to-layer="5513" to-port="0" /> + <edge from-layer="5512" from-port="0" to-layer="5513" to-port="1" /> + <edge from-layer="5513" from-port="2" to-layer="5522" to-port="0" /> + <edge from-layer="5514" from-port="0" to-layer="5515" to-port="0" /> + <edge from-layer="5515" from-port="1" to-layer="5518" to-port="0" /> + <edge from-layer="5516" from-port="0" to-layer="5517" to-port="0" /> + <edge from-layer="5517" from-port="1" to-layer="5518" to-port="1" /> + <edge from-layer="5518" from-port="2" to-layer="5520" to-port="0" /> + <edge from-layer="5519" from-port="0" to-layer="5520" to-port="1" /> + <edge from-layer="5520" from-port="2" to-layer="5521" to-port="0" /> + <edge from-layer="5521" from-port="1" to-layer="5522" to-port="1" /> + <edge from-layer="5522" from-port="2" to-layer="5524" to-port="0" /> + <edge from-layer="5523" from-port="0" to-layer="5524" to-port="1" /> + <edge from-layer="5524" from-port="2" to-layer="5526" to-port="0" /> + <edge from-layer="5525" from-port="0" to-layer="5526" to-port="1" /> + <edge from-layer="5526" from-port="2" to-layer="5530" to-port="0" /> + <edge from-layer="5526" from-port="2" to-layer="5640" to-port="0" /> + <edge from-layer="5526" from-port="2" to-layer="5542" to-port="0" /> + <edge from-layer="5527" from-port="0" to-layer="5530" to-port="1" /> + <edge from-layer="5528" from-port="0" to-layer="5530" to-port="2" /> + <edge from-layer="5529" from-port="0" to-layer="5530" to-port="3" /> + <edge from-layer="5530" from-port="4" to-layer="5532" to-port="0" /> + <edge from-layer="5531" from-port="0" to-layer="5532" to-port="1" /> + <edge from-layer="5532" from-port="2" to-layer="5536" to-port="0" /> + <edge from-layer="5533" from-port="0" to-layer="5536" to-port="1" /> + <edge from-layer="5534" from-port="0" to-layer="5536" to-port="2" /> + <edge from-layer="5535" from-port="0" to-layer="5536" to-port="3" /> + <edge from-layer="5536" from-port="4" to-layer="5582" to-port="0" /> + <edge from-layer="5536" from-port="4" to-layer="5587" to-port="0" /> + <edge from-layer="5536" from-port="4" to-layer="5571" to-port="0" /> + <edge from-layer="5536" from-port="4" to-layer="5568" to-port="0" /> + <edge from-layer="5537" from-port="0" to-layer="5564" to-port="0" /> + <edge from-layer="5538" from-port="0" to-layer="5564" to-port="1" /> + <edge from-layer="5539" from-port="0" to-layer="5542" to-port="1" /> + <edge from-layer="5540" from-port="0" to-layer="5542" to-port="2" /> + <edge from-layer="5541" from-port="0" to-layer="5542" to-port="3" /> + <edge from-layer="5542" from-port="4" to-layer="5543" to-port="0" /> + <edge from-layer="5542" from-port="4" to-layer="5599" to-port="0" /> + <edge from-layer="5543" from-port="1" to-layer="5546" to-port="0" /> + <edge from-layer="5544" from-port="0" to-layer="5546" to-port="1" /> + <edge from-layer="5545" from-port="0" to-layer="5546" to-port="2" /> + <edge from-layer="5546" from-port="3" to-layer="5562" to-port="0" /> + <edge from-layer="5547" from-port="0" to-layer="5552" to-port="0" /> + <edge from-layer="5548" from-port="0" to-layer="5551" to-port="1" /> + <edge from-layer="5549" from-port="0" to-layer="5551" to-port="2" /> + <edge from-layer="5550" from-port="0" to-layer="5551" to-port="3" /> + <edge from-layer="5551" from-port="4" to-layer="5552" to-port="1" /> + <edge from-layer="5552" from-port="2" to-layer="5553" to-port="0" /> + <edge from-layer="5553" from-port="1" to-layer="5555" to-port="0" /> + <edge from-layer="5554" from-port="0" to-layer="5555" to-port="2" /> + <edge from-layer="5555" from-port="3" to-layer="5556" to-port="0" /> + <edge from-layer="5555" from-port="3" to-layer="5627" to-port="0" /> + <edge from-layer="5556" from-port="1" to-layer="5559" to-port="0" /> + <edge from-layer="5557" from-port="0" to-layer="5559" to-port="1" /> + <edge from-layer="5558" from-port="0" to-layer="5559" to-port="2" /> + <edge from-layer="5559" from-port="3" to-layer="5561" to-port="0" /> + <edge from-layer="5559" from-port="3" to-layer="5651" to-port="0" /> + <edge from-layer="5560" from-port="0" to-layer="5561" to-port="1" /> + <edge from-layer="5561" from-port="2" to-layer="5562" to-port="1" /> + <edge from-layer="5562" from-port="2" to-layer="5564" to-port="2" /> + <edge from-layer="5562" from-port="2" to-layer="5592" to-port="2" /> + <edge from-layer="5563" from-port="0" to-layer="5564" to-port="3" /> + <edge from-layer="5564" from-port="4" to-layer="5566" to-port="0" /> + <edge from-layer="5565" from-port="0" to-layer="5566" to-port="2" /> + <edge from-layer="5566" from-port="3" to-layer="5567" to-port="0" /> + <edge from-layer="5567" from-port="2" to-layer="5568" to-port="1" /> + <edge from-layer="5567" from-port="2" to-layer="5604" to-port="1" /> + <edge from-layer="5568" from-port="2" to-layer="5597" to-port="0" /> + <edge from-layer="5569" from-port="0" to-layer="5579" to-port="0" /> + <edge from-layer="5570" from-port="0" to-layer="5579" to-port="1" /> + <edge from-layer="5571" from-port="1" to-layer="5573" to-port="0" /> + <edge from-layer="5572" from-port="0" to-layer="5573" to-port="2" /> + <edge from-layer="5573" from-port="3" to-layer="5574" to-port="0" /> + <edge from-layer="5574" from-port="2" to-layer="5575" to-port="0" /> + <edge from-layer="5575" from-port="1" to-layer="5577" to-port="0" /> + <edge from-layer="5576" from-port="0" to-layer="5577" to-port="1" /> + <edge from-layer="5577" from-port="2" to-layer="5579" to-port="2" /> + <edge from-layer="5578" from-port="0" to-layer="5579" to-port="3" /> + <edge from-layer="5579" from-port="4" to-layer="5587" to-port="2" /> + <edge from-layer="5579" from-port="4" to-layer="5582" to-port="1" /> + <edge from-layer="5580" from-port="0" to-layer="5582" to-port="2" /> + <edge from-layer="5581" from-port="0" to-layer="5582" to-port="3" /> + <edge from-layer="5582" from-port="4" to-layer="5584" to-port="0" /> + <edge from-layer="5583" from-port="0" to-layer="5584" to-port="1" /> + <edge from-layer="5584" from-port="2" to-layer="5588" to-port="0" /> + <edge from-layer="5585" from-port="0" to-layer="5587" to-port="1" /> + <edge from-layer="5586" from-port="0" to-layer="5587" to-port="3" /> + <edge from-layer="5587" from-port="4" to-layer="5588" to-port="1" /> + <edge from-layer="5588" from-port="2" to-layer="5596" to-port="0" /> + <edge from-layer="5589" from-port="0" to-layer="5592" to-port="0" /> + <edge from-layer="5590" from-port="0" to-layer="5592" to-port="1" /> + <edge from-layer="5591" from-port="0" to-layer="5592" to-port="3" /> + <edge from-layer="5592" from-port="4" to-layer="5594" to-port="0" /> + <edge from-layer="5593" from-port="0" to-layer="5594" to-port="2" /> + <edge from-layer="5594" from-port="3" to-layer="5595" to-port="0" /> + <edge from-layer="5595" from-port="2" to-layer="5596" to-port="1" /> + <edge from-layer="5595" from-port="2" to-layer="5625" to-port="1" /> + <edge from-layer="5596" from-port="2" to-layer="5597" to-port="1" /> + <edge from-layer="5597" from-port="2" to-layer="5688" to-port="0" /> + <edge from-layer="5597" from-port="2" to-layer="5652" to-port="0" /> + <edge from-layer="5598" from-port="0" to-layer="5599" to-port="1" /> + <edge from-layer="5599" from-port="2" to-layer="5603" to-port="0" /> + <edge from-layer="5600" from-port="0" to-layer="5603" to-port="1" /> + <edge from-layer="5601" from-port="0" to-layer="5603" to-port="2" /> + <edge from-layer="5602" from-port="0" to-layer="5603" to-port="3" /> + <edge from-layer="5603" from-port="4" to-layer="5604" to-port="0" /> + <edge from-layer="5603" from-port="4" to-layer="5607" to-port="0" /> + <edge from-layer="5603" from-port="4" to-layer="5623" to-port="0" /> + <edge from-layer="5603" from-port="4" to-layer="5618" to-port="0" /> + <edge from-layer="5604" from-port="2" to-layer="5626" to-port="0" /> + <edge from-layer="5605" from-port="0" to-layer="5615" to-port="0" /> + <edge from-layer="5606" from-port="0" to-layer="5615" to-port="1" /> + <edge from-layer="5607" from-port="1" to-layer="5609" to-port="0" /> + <edge from-layer="5608" from-port="0" to-layer="5609" to-port="2" /> + <edge from-layer="5609" from-port="3" to-layer="5610" to-port="0" /> + <edge from-layer="5610" from-port="2" to-layer="5611" to-port="0" /> + <edge from-layer="5611" from-port="1" to-layer="5613" to-port="0" /> + <edge from-layer="5612" from-port="0" to-layer="5613" to-port="1" /> + <edge from-layer="5613" from-port="2" to-layer="5615" to-port="2" /> + <edge from-layer="5614" from-port="0" to-layer="5615" to-port="3" /> + <edge from-layer="5615" from-port="4" to-layer="5618" to-port="1" /> + <edge from-layer="5615" from-port="4" to-layer="5623" to-port="2" /> + <edge from-layer="5616" from-port="0" to-layer="5618" to-port="2" /> + <edge from-layer="5617" from-port="0" to-layer="5618" to-port="3" /> + <edge from-layer="5618" from-port="4" to-layer="5620" to-port="0" /> + <edge from-layer="5619" from-port="0" to-layer="5620" to-port="1" /> + <edge from-layer="5620" from-port="2" to-layer="5624" to-port="0" /> + <edge from-layer="5621" from-port="0" to-layer="5623" to-port="1" /> + <edge from-layer="5622" from-port="0" to-layer="5623" to-port="3" /> + <edge from-layer="5623" from-port="4" to-layer="5624" to-port="1" /> + <edge from-layer="5624" from-port="2" to-layer="5625" to-port="0" /> + <edge from-layer="5625" from-port="2" to-layer="5626" to-port="1" /> + <edge from-layer="5626" from-port="2" to-layer="5647" to-port="0" /> + <edge from-layer="5626" from-port="2" to-layer="5627" to-port="1" /> + <edge from-layer="5627" from-port="2" to-layer="7206" to-port="0" /> + <edge from-layer="5627" from-port="2" to-layer="5688" to-port="1" /> + <edge from-layer="5628" from-port="0" to-layer="5633" to-port="0" /> + <edge from-layer="5629" from-port="0" to-layer="5632" to-port="1" /> + <edge from-layer="5630" from-port="0" to-layer="5632" to-port="2" /> + <edge from-layer="5631" from-port="0" to-layer="5632" to-port="3" /> + <edge from-layer="5632" from-port="4" to-layer="5633" to-port="1" /> + <edge from-layer="5633" from-port="2" to-layer="5634" to-port="0" /> + <edge from-layer="5634" from-port="1" to-layer="5636" to-port="0" /> + <edge from-layer="5635" from-port="0" to-layer="5636" to-port="2" /> + <edge from-layer="5636" from-port="3" to-layer="5643" to-port="0" /> + <edge from-layer="5637" from-port="0" to-layer="5640" to-port="1" /> + <edge from-layer="5638" from-port="0" to-layer="5640" to-port="2" /> + <edge from-layer="5639" from-port="0" to-layer="5640" to-port="3" /> + <edge from-layer="5640" from-port="4" to-layer="5642" to-port="0" /> + <edge from-layer="5641" from-port="0" to-layer="5642" to-port="1" /> + <edge from-layer="5642" from-port="2" to-layer="5643" to-port="1" /> + <edge from-layer="5643" from-port="2" to-layer="7205" to-port="0" /> + <edge from-layer="5643" from-port="2" to-layer="5688" to-port="2" /> + <edge from-layer="5644" from-port="0" to-layer="5666" to-port="0" /> + <edge from-layer="5645" from-port="0" to-layer="5660" to-port="0" /> + <edge from-layer="5646" from-port="0" to-layer="5660" to-port="1" /> + <edge from-layer="5646" from-port="0" to-layer="5664" to-port="1" /> + <edge from-layer="5647" from-port="1" to-layer="5650" to-port="0" /> + <edge from-layer="5648" from-port="0" to-layer="5650" to-port="1" /> + <edge from-layer="5649" from-port="0" to-layer="5650" to-port="2" /> + <edge from-layer="5650" from-port="3" to-layer="5651" to-port="1" /> + <edge from-layer="5651" from-port="2" to-layer="5663" to-port="0" /> + <edge from-layer="5651" from-port="2" to-layer="5656" to-port="0" /> + <edge from-layer="5652" from-port="1" to-layer="5655" to-port="0" /> + <edge from-layer="5652" from-port="1" to-layer="5681" to-port="0" /> + <edge from-layer="5653" from-port="0" to-layer="5655" to-port="1" /> + <edge from-layer="5654" from-port="0" to-layer="5655" to-port="2" /> + <edge from-layer="5655" from-port="3" to-layer="5656" to-port="1" /> + <edge from-layer="5656" from-port="2" to-layer="5658" to-port="0" /> + <edge from-layer="5657" from-port="0" to-layer="5658" to-port="1" /> + <edge from-layer="5658" from-port="2" to-layer="5660" to-port="2" /> + <edge from-layer="5659" from-port="0" to-layer="5664" to-port="3" /> + <edge from-layer="5659" from-port="0" to-layer="5660" to-port="3" /> + <edge from-layer="5660" from-port="4" to-layer="5666" to-port="1" /> + <edge from-layer="5661" from-port="0" to-layer="5664" to-port="0" /> + <edge from-layer="5662" from-port="0" to-layer="5663" to-port="1" /> + <edge from-layer="5663" from-port="2" to-layer="5671" to-port="2" /> + <edge from-layer="5663" from-port="2" to-layer="5664" to-port="2" /> + <edge from-layer="5664" from-port="4" to-layer="5666" to-port="2" /> + <edge from-layer="5665" from-port="0" to-layer="5666" to-port="3" /> + <edge from-layer="5666" from-port="4" to-layer="5673" to-port="0" /> + <edge from-layer="5667" from-port="0" to-layer="5673" to-port="1" /> + <edge from-layer="5668" from-port="0" to-layer="5671" to-port="0" /> + <edge from-layer="5669" from-port="0" to-layer="5671" to-port="1" /> + <edge from-layer="5670" from-port="0" to-layer="5671" to-port="3" /> + <edge from-layer="5671" from-port="4" to-layer="5673" to-port="2" /> + <edge from-layer="5672" from-port="0" to-layer="5673" to-port="3" /> + <edge from-layer="5673" from-port="4" to-layer="5676" to-port="0" /> + <edge from-layer="5674" from-port="0" to-layer="5676" to-port="1" /> + <edge from-layer="5675" from-port="0" to-layer="5676" to-port="2" /> + <edge from-layer="5676" from-port="3" to-layer="5677" to-port="0" /> + <edge from-layer="5677" from-port="2" to-layer="5678" to-port="0" /> + <edge from-layer="5677" from-port="2" to-layer="5687" to-port="0" /> + <edge from-layer="5678" from-port="1" to-layer="5686" to-port="0" /> + <edge from-layer="5679" from-port="0" to-layer="5681" to-port="1" /> + <edge from-layer="5680" from-port="0" to-layer="5681" to-port="2" /> + <edge from-layer="5681" from-port="3" to-layer="5685" to-port="0" /> + <edge from-layer="5682" from-port="0" to-layer="5685" to-port="1" /> + <edge from-layer="5683" from-port="0" to-layer="5685" to-port="2" /> + <edge from-layer="5684" from-port="0" to-layer="5685" to-port="3" /> + <edge from-layer="5685" from-port="4" to-layer="5686" to-port="1" /> + <edge from-layer="5686" from-port="2" to-layer="5687" to-port="1" /> + <edge from-layer="5687" from-port="2" to-layer="5688" to-port="3" /> + <edge from-layer="5688" from-port="4" to-layer="5690" to-port="0" /> + <edge from-layer="5689" from-port="0" to-layer="5690" to-port="1" /> + <edge from-layer="5690" from-port="2" to-layer="5692" to-port="0" /> + <edge from-layer="5691" from-port="0" to-layer="5692" to-port="1" /> + <edge from-layer="5692" from-port="2" to-layer="5701" to-port="0" /> + <edge from-layer="5693" from-port="0" to-layer="5694" to-port="0" /> + <edge from-layer="5694" from-port="1" to-layer="5697" to-port="0" /> + <edge from-layer="5695" from-port="0" to-layer="5696" to-port="0" /> + <edge from-layer="5696" from-port="1" to-layer="5697" to-port="1" /> + <edge from-layer="5697" from-port="2" to-layer="5699" to-port="0" /> + <edge from-layer="5698" from-port="0" to-layer="5699" to-port="1" /> + <edge from-layer="5699" from-port="2" to-layer="5700" to-port="0" /> + <edge from-layer="5700" from-port="1" to-layer="5701" to-port="1" /> + <edge from-layer="5701" from-port="2" to-layer="5703" to-port="0" /> + <edge from-layer="5702" from-port="0" to-layer="5703" to-port="1" /> + <edge from-layer="5703" from-port="2" to-layer="5704" to-port="0" /> + <edge from-layer="5704" from-port="2" to-layer="5734" to-port="1" /> + <edge from-layer="5704" from-port="2" to-layer="5706" to-port="0" /> + <edge from-layer="5705" from-port="0" to-layer="5706" to-port="1" /> + <edge from-layer="5706" from-port="2" to-layer="5708" to-port="0" /> + <edge from-layer="5707" from-port="0" to-layer="5708" to-port="1" /> + <edge from-layer="5708" from-port="2" to-layer="5710" to-port="0" /> + <edge from-layer="5709" from-port="0" to-layer="5710" to-port="1" /> + <edge from-layer="5710" from-port="2" to-layer="5719" to-port="0" /> + <edge from-layer="5711" from-port="0" to-layer="5712" to-port="0" /> + <edge from-layer="5712" from-port="1" to-layer="5715" to-port="0" /> + <edge from-layer="5713" from-port="0" to-layer="5714" to-port="0" /> + <edge from-layer="5714" from-port="1" to-layer="5715" to-port="1" /> + <edge from-layer="5715" from-port="2" to-layer="5717" to-port="0" /> + <edge from-layer="5716" from-port="0" to-layer="5717" to-port="1" /> + <edge from-layer="5717" from-port="2" to-layer="5718" to-port="0" /> + <edge from-layer="5718" from-port="1" to-layer="5719" to-port="1" /> + <edge from-layer="5719" from-port="2" to-layer="5721" to-port="0" /> + <edge from-layer="5720" from-port="0" to-layer="5721" to-port="1" /> + <edge from-layer="5721" from-port="2" to-layer="5722" to-port="0" /> + <edge from-layer="5722" from-port="1" to-layer="5731" to-port="0" /> + <edge from-layer="5723" from-port="0" to-layer="5724" to-port="0" /> + <edge from-layer="5724" from-port="1" to-layer="5727" to-port="0" /> + <edge from-layer="5725" from-port="0" to-layer="5726" to-port="0" /> + <edge from-layer="5726" from-port="1" to-layer="5727" to-port="1" /> + <edge from-layer="5727" from-port="2" to-layer="5729" to-port="0" /> + <edge from-layer="5728" from-port="0" to-layer="5729" to-port="1" /> + <edge from-layer="5729" from-port="2" to-layer="5730" to-port="0" /> + <edge from-layer="5730" from-port="1" to-layer="5731" to-port="1" /> + <edge from-layer="5731" from-port="2" to-layer="5733" to-port="0" /> + <edge from-layer="5732" from-port="0" to-layer="5733" to-port="1" /> + <edge from-layer="5733" from-port="2" to-layer="5734" to-port="0" /> + <edge from-layer="5734" from-port="2" to-layer="5736" to-port="0" /> + <edge from-layer="5734" from-port="2" to-layer="5931" to-port="1" /> + <edge from-layer="5735" from-port="0" to-layer="5736" to-port="1" /> + <edge from-layer="5736" from-port="2" to-layer="5738" to-port="0" /> + <edge from-layer="5737" from-port="0" to-layer="5738" to-port="1" /> + <edge from-layer="5738" from-port="2" to-layer="5740" to-port="0" /> + <edge from-layer="5739" from-port="0" to-layer="5740" to-port="1" /> + <edge from-layer="5740" from-port="2" to-layer="5749" to-port="0" /> + <edge from-layer="5741" from-port="0" to-layer="5742" to-port="0" /> + <edge from-layer="5742" from-port="1" to-layer="5745" to-port="0" /> + <edge from-layer="5743" from-port="0" to-layer="5744" to-port="0" /> + <edge from-layer="5744" from-port="1" to-layer="5745" to-port="1" /> + <edge from-layer="5745" from-port="2" to-layer="5747" to-port="0" /> + <edge from-layer="5746" from-port="0" to-layer="5747" to-port="1" /> + <edge from-layer="5747" from-port="2" to-layer="5748" to-port="0" /> + <edge from-layer="5748" from-port="1" to-layer="5749" to-port="1" /> + <edge from-layer="5749" from-port="2" to-layer="5751" to-port="0" /> + <edge from-layer="5750" from-port="0" to-layer="5751" to-port="1" /> + <edge from-layer="5751" from-port="2" to-layer="5753" to-port="0" /> + <edge from-layer="5752" from-port="0" to-layer="5753" to-port="1" /> + <edge from-layer="5753" from-port="2" to-layer="5867" to-port="0" /> + <edge from-layer="5753" from-port="2" to-layer="5769" to-port="0" /> + <edge from-layer="5753" from-port="2" to-layer="5757" to-port="0" /> + <edge from-layer="5754" from-port="0" to-layer="5757" to-port="1" /> + <edge from-layer="5755" from-port="0" to-layer="5757" to-port="2" /> + <edge from-layer="5756" from-port="0" to-layer="5757" to-port="3" /> + <edge from-layer="5757" from-port="4" to-layer="5759" to-port="0" /> + <edge from-layer="5758" from-port="0" to-layer="5759" to-port="1" /> + <edge from-layer="5759" from-port="2" to-layer="5763" to-port="0" /> + <edge from-layer="5760" from-port="0" to-layer="5763" to-port="1" /> + <edge from-layer="5761" from-port="0" to-layer="5763" to-port="2" /> + <edge from-layer="5762" from-port="0" to-layer="5763" to-port="3" /> + <edge from-layer="5763" from-port="4" to-layer="5814" to-port="0" /> + <edge from-layer="5763" from-port="4" to-layer="5795" to-port="0" /> + <edge from-layer="5763" from-port="4" to-layer="5798" to-port="0" /> + <edge from-layer="5763" from-port="4" to-layer="5809" to-port="0" /> + <edge from-layer="5764" from-port="0" to-layer="5791" to-port="0" /> + <edge from-layer="5765" from-port="0" to-layer="5791" to-port="1" /> + <edge from-layer="5766" from-port="0" to-layer="5769" to-port="1" /> + <edge from-layer="5767" from-port="0" to-layer="5769" to-port="2" /> + <edge from-layer="5768" from-port="0" to-layer="5769" to-port="3" /> + <edge from-layer="5769" from-port="4" to-layer="5770" to-port="0" /> + <edge from-layer="5769" from-port="4" to-layer="5826" to-port="0" /> + <edge from-layer="5770" from-port="1" to-layer="5773" to-port="0" /> + <edge from-layer="5771" from-port="0" to-layer="5773" to-port="1" /> + <edge from-layer="5772" from-port="0" to-layer="5773" to-port="2" /> + <edge from-layer="5773" from-port="3" to-layer="5789" to-port="0" /> + <edge from-layer="5774" from-port="0" to-layer="5779" to-port="0" /> + <edge from-layer="5775" from-port="0" to-layer="5778" to-port="1" /> + <edge from-layer="5776" from-port="0" to-layer="5778" to-port="2" /> + <edge from-layer="5777" from-port="0" to-layer="5778" to-port="3" /> + <edge from-layer="5778" from-port="4" to-layer="5779" to-port="1" /> + <edge from-layer="5779" from-port="2" to-layer="5780" to-port="0" /> + <edge from-layer="5780" from-port="1" to-layer="5782" to-port="0" /> + <edge from-layer="5781" from-port="0" to-layer="5782" to-port="2" /> + <edge from-layer="5782" from-port="3" to-layer="5783" to-port="0" /> + <edge from-layer="5782" from-port="3" to-layer="5854" to-port="0" /> + <edge from-layer="5783" from-port="1" to-layer="5786" to-port="0" /> + <edge from-layer="5784" from-port="0" to-layer="5786" to-port="1" /> + <edge from-layer="5785" from-port="0" to-layer="5786" to-port="2" /> + <edge from-layer="5786" from-port="3" to-layer="5878" to-port="0" /> + <edge from-layer="5786" from-port="3" to-layer="5788" to-port="0" /> + <edge from-layer="5787" from-port="0" to-layer="5788" to-port="1" /> + <edge from-layer="5788" from-port="2" to-layer="5789" to-port="1" /> + <edge from-layer="5789" from-port="2" to-layer="5791" to-port="2" /> + <edge from-layer="5789" from-port="2" to-layer="5819" to-port="2" /> + <edge from-layer="5790" from-port="0" to-layer="5791" to-port="3" /> + <edge from-layer="5791" from-port="4" to-layer="5793" to-port="0" /> + <edge from-layer="5792" from-port="0" to-layer="5793" to-port="2" /> + <edge from-layer="5793" from-port="3" to-layer="5794" to-port="0" /> + <edge from-layer="5794" from-port="2" to-layer="5831" to-port="1" /> + <edge from-layer="5794" from-port="2" to-layer="5795" to-port="1" /> + <edge from-layer="5795" from-port="2" to-layer="5824" to-port="0" /> + <edge from-layer="5796" from-port="0" to-layer="5806" to-port="0" /> + <edge from-layer="5797" from-port="0" to-layer="5806" to-port="1" /> + <edge from-layer="5798" from-port="1" to-layer="5800" to-port="0" /> + <edge from-layer="5799" from-port="0" to-layer="5800" to-port="2" /> + <edge from-layer="5800" from-port="3" to-layer="5801" to-port="0" /> + <edge from-layer="5801" from-port="2" to-layer="5802" to-port="0" /> + <edge from-layer="5802" from-port="1" to-layer="5804" to-port="0" /> + <edge from-layer="5803" from-port="0" to-layer="5804" to-port="1" /> + <edge from-layer="5804" from-port="2" to-layer="5806" to-port="2" /> + <edge from-layer="5805" from-port="0" to-layer="5806" to-port="3" /> + <edge from-layer="5806" from-port="4" to-layer="5809" to-port="1" /> + <edge from-layer="5806" from-port="4" to-layer="5814" to-port="2" /> + <edge from-layer="5807" from-port="0" to-layer="5809" to-port="2" /> + <edge from-layer="5808" from-port="0" to-layer="5809" to-port="3" /> + <edge from-layer="5809" from-port="4" to-layer="5811" to-port="0" /> + <edge from-layer="5810" from-port="0" to-layer="5811" to-port="1" /> + <edge from-layer="5811" from-port="2" to-layer="5815" to-port="0" /> + <edge from-layer="5812" from-port="0" to-layer="5814" to-port="1" /> + <edge from-layer="5813" from-port="0" to-layer="5814" to-port="3" /> + <edge from-layer="5814" from-port="4" to-layer="5815" to-port="1" /> + <edge from-layer="5815" from-port="2" to-layer="5823" to-port="0" /> + <edge from-layer="5816" from-port="0" to-layer="5819" to-port="0" /> + <edge from-layer="5817" from-port="0" to-layer="5819" to-port="1" /> + <edge from-layer="5818" from-port="0" to-layer="5819" to-port="3" /> + <edge from-layer="5819" from-port="4" to-layer="5821" to-port="0" /> + <edge from-layer="5820" from-port="0" to-layer="5821" to-port="2" /> + <edge from-layer="5821" from-port="3" to-layer="5822" to-port="0" /> + <edge from-layer="5822" from-port="2" to-layer="5852" to-port="1" /> + <edge from-layer="5822" from-port="2" to-layer="5823" to-port="1" /> + <edge from-layer="5823" from-port="2" to-layer="5824" to-port="1" /> + <edge from-layer="5824" from-port="2" to-layer="5915" to-port="0" /> + <edge from-layer="5824" from-port="2" to-layer="5879" to-port="0" /> + <edge from-layer="5825" from-port="0" to-layer="5826" to-port="1" /> + <edge from-layer="5826" from-port="2" to-layer="5830" to-port="0" /> + <edge from-layer="5827" from-port="0" to-layer="5830" to-port="1" /> + <edge from-layer="5828" from-port="0" to-layer="5830" to-port="2" /> + <edge from-layer="5829" from-port="0" to-layer="5830" to-port="3" /> + <edge from-layer="5830" from-port="4" to-layer="5831" to-port="0" /> + <edge from-layer="5830" from-port="4" to-layer="5834" to-port="0" /> + <edge from-layer="5830" from-port="4" to-layer="5850" to-port="0" /> + <edge from-layer="5830" from-port="4" to-layer="5845" to-port="0" /> + <edge from-layer="5831" from-port="2" to-layer="5853" to-port="0" /> + <edge from-layer="5832" from-port="0" to-layer="5842" to-port="0" /> + <edge from-layer="5833" from-port="0" to-layer="5842" to-port="1" /> + <edge from-layer="5834" from-port="1" to-layer="5836" to-port="0" /> + <edge from-layer="5835" from-port="0" to-layer="5836" to-port="2" /> + <edge from-layer="5836" from-port="3" to-layer="5837" to-port="0" /> + <edge from-layer="5837" from-port="2" to-layer="5838" to-port="0" /> + <edge from-layer="5838" from-port="1" to-layer="5840" to-port="0" /> + <edge from-layer="5839" from-port="0" to-layer="5840" to-port="1" /> + <edge from-layer="5840" from-port="2" to-layer="5842" to-port="2" /> + <edge from-layer="5841" from-port="0" to-layer="5842" to-port="3" /> + <edge from-layer="5842" from-port="4" to-layer="5845" to-port="1" /> + <edge from-layer="5842" from-port="4" to-layer="5850" to-port="2" /> + <edge from-layer="5843" from-port="0" to-layer="5845" to-port="2" /> + <edge from-layer="5844" from-port="0" to-layer="5845" to-port="3" /> + <edge from-layer="5845" from-port="4" to-layer="5847" to-port="0" /> + <edge from-layer="5846" from-port="0" to-layer="5847" to-port="1" /> + <edge from-layer="5847" from-port="2" to-layer="5851" to-port="0" /> + <edge from-layer="5848" from-port="0" to-layer="5850" to-port="1" /> + <edge from-layer="5849" from-port="0" to-layer="5850" to-port="3" /> + <edge from-layer="5850" from-port="4" to-layer="5851" to-port="1" /> + <edge from-layer="5851" from-port="2" to-layer="5852" to-port="0" /> + <edge from-layer="5852" from-port="2" to-layer="5853" to-port="1" /> + <edge from-layer="5853" from-port="2" to-layer="5854" to-port="1" /> + <edge from-layer="5853" from-port="2" to-layer="5874" to-port="0" /> + <edge from-layer="5854" from-port="2" to-layer="7204" to-port="0" /> + <edge from-layer="5854" from-port="2" to-layer="5915" to-port="1" /> + <edge from-layer="5855" from-port="0" to-layer="5860" to-port="0" /> + <edge from-layer="5856" from-port="0" to-layer="5859" to-port="1" /> + <edge from-layer="5857" from-port="0" to-layer="5859" to-port="2" /> + <edge from-layer="5858" from-port="0" to-layer="5859" to-port="3" /> + <edge from-layer="5859" from-port="4" to-layer="5860" to-port="1" /> + <edge from-layer="5860" from-port="2" to-layer="5861" to-port="0" /> + <edge from-layer="5861" from-port="1" to-layer="5863" to-port="0" /> + <edge from-layer="5862" from-port="0" to-layer="5863" to-port="2" /> + <edge from-layer="5863" from-port="3" to-layer="5870" to-port="0" /> + <edge from-layer="5864" from-port="0" to-layer="5867" to-port="1" /> + <edge from-layer="5865" from-port="0" to-layer="5867" to-port="2" /> + <edge from-layer="5866" from-port="0" to-layer="5867" to-port="3" /> + <edge from-layer="5867" from-port="4" to-layer="5869" to-port="0" /> + <edge from-layer="5868" from-port="0" to-layer="5869" to-port="1" /> + <edge from-layer="5869" from-port="2" to-layer="5870" to-port="1" /> + <edge from-layer="5870" from-port="2" to-layer="7203" to-port="0" /> + <edge from-layer="5870" from-port="2" to-layer="5915" to-port="2" /> + <edge from-layer="5871" from-port="0" to-layer="5893" to-port="0" /> + <edge from-layer="5872" from-port="0" to-layer="5887" to-port="0" /> + <edge from-layer="5873" from-port="0" to-layer="5891" to-port="1" /> + <edge from-layer="5873" from-port="0" to-layer="5887" to-port="1" /> + <edge from-layer="5874" from-port="1" to-layer="5877" to-port="0" /> + <edge from-layer="5875" from-port="0" to-layer="5877" to-port="1" /> + <edge from-layer="5876" from-port="0" to-layer="5877" to-port="2" /> + <edge from-layer="5877" from-port="3" to-layer="5878" to-port="1" /> + <edge from-layer="5878" from-port="2" to-layer="5890" to-port="0" /> + <edge from-layer="5878" from-port="2" to-layer="5883" to-port="0" /> + <edge from-layer="5879" from-port="1" to-layer="5882" to-port="0" /> + <edge from-layer="5879" from-port="1" to-layer="5908" to-port="0" /> + <edge from-layer="5880" from-port="0" to-layer="5882" to-port="1" /> + <edge from-layer="5881" from-port="0" to-layer="5882" to-port="2" /> + <edge from-layer="5882" from-port="3" to-layer="5883" to-port="1" /> + <edge from-layer="5883" from-port="2" to-layer="5885" to-port="0" /> + <edge from-layer="5884" from-port="0" to-layer="5885" to-port="1" /> + <edge from-layer="5885" from-port="2" to-layer="5887" to-port="2" /> + <edge from-layer="5886" from-port="0" to-layer="5887" to-port="3" /> + <edge from-layer="5886" from-port="0" to-layer="5891" to-port="3" /> + <edge from-layer="5887" from-port="4" to-layer="5893" to-port="1" /> + <edge from-layer="5888" from-port="0" to-layer="5891" to-port="0" /> + <edge from-layer="5889" from-port="0" to-layer="5890" to-port="1" /> + <edge from-layer="5890" from-port="2" to-layer="5891" to-port="2" /> + <edge from-layer="5890" from-port="2" to-layer="5898" to-port="2" /> + <edge from-layer="5891" from-port="4" to-layer="5893" to-port="2" /> + <edge from-layer="5892" from-port="0" to-layer="5893" to-port="3" /> + <edge from-layer="5893" from-port="4" to-layer="5900" to-port="0" /> + <edge from-layer="5894" from-port="0" to-layer="5900" to-port="1" /> + <edge from-layer="5895" from-port="0" to-layer="5898" to-port="0" /> + <edge from-layer="5896" from-port="0" to-layer="5898" to-port="1" /> + <edge from-layer="5897" from-port="0" to-layer="5898" to-port="3" /> + <edge from-layer="5898" from-port="4" to-layer="5900" to-port="2" /> + <edge from-layer="5899" from-port="0" to-layer="5900" to-port="3" /> + <edge from-layer="5900" from-port="4" to-layer="5903" to-port="0" /> + <edge from-layer="5901" from-port="0" to-layer="5903" to-port="1" /> + <edge from-layer="5902" from-port="0" to-layer="5903" to-port="2" /> + <edge from-layer="5903" from-port="3" to-layer="5904" to-port="0" /> + <edge from-layer="5904" from-port="2" to-layer="5905" to-port="0" /> + <edge from-layer="5904" from-port="2" to-layer="5914" to-port="0" /> + <edge from-layer="5905" from-port="1" to-layer="5913" to-port="0" /> + <edge from-layer="5906" from-port="0" to-layer="5908" to-port="1" /> + <edge from-layer="5907" from-port="0" to-layer="5908" to-port="2" /> + <edge from-layer="5908" from-port="3" to-layer="5912" to-port="0" /> + <edge from-layer="5909" from-port="0" to-layer="5912" to-port="1" /> + <edge from-layer="5910" from-port="0" to-layer="5912" to-port="2" /> + <edge from-layer="5911" from-port="0" to-layer="5912" to-port="3" /> + <edge from-layer="5912" from-port="4" to-layer="5913" to-port="1" /> + <edge from-layer="5913" from-port="2" to-layer="5914" to-port="1" /> + <edge from-layer="5914" from-port="2" to-layer="5915" to-port="3" /> + <edge from-layer="5915" from-port="4" to-layer="5917" to-port="0" /> + <edge from-layer="5916" from-port="0" to-layer="5917" to-port="1" /> + <edge from-layer="5917" from-port="2" to-layer="5919" to-port="0" /> + <edge from-layer="5918" from-port="0" to-layer="5919" to-port="1" /> + <edge from-layer="5919" from-port="2" to-layer="5928" to-port="0" /> + <edge from-layer="5920" from-port="0" to-layer="5921" to-port="0" /> + <edge from-layer="5921" from-port="1" to-layer="5924" to-port="0" /> + <edge from-layer="5922" from-port="0" to-layer="5923" to-port="0" /> + <edge from-layer="5923" from-port="1" to-layer="5924" to-port="1" /> + <edge from-layer="5924" from-port="2" to-layer="5926" to-port="0" /> + <edge from-layer="5925" from-port="0" to-layer="5926" to-port="1" /> + <edge from-layer="5926" from-port="2" to-layer="5927" to-port="0" /> + <edge from-layer="5927" from-port="1" to-layer="5928" to-port="1" /> + <edge from-layer="5928" from-port="2" to-layer="5930" to-port="0" /> + <edge from-layer="5929" from-port="0" to-layer="5930" to-port="1" /> + <edge from-layer="5930" from-port="2" to-layer="5931" to-port="0" /> + <edge from-layer="5931" from-port="2" to-layer="5933" to-port="0" /> + <edge from-layer="5931" from-port="2" to-layer="5961" to-port="1" /> + <edge from-layer="5932" from-port="0" to-layer="5933" to-port="1" /> + <edge from-layer="5933" from-port="2" to-layer="5935" to-port="0" /> + <edge from-layer="5934" from-port="0" to-layer="5935" to-port="1" /> + <edge from-layer="5935" from-port="2" to-layer="5937" to-port="0" /> + <edge from-layer="5936" from-port="0" to-layer="5937" to-port="1" /> + <edge from-layer="5937" from-port="2" to-layer="5946" to-port="0" /> + <edge from-layer="5938" from-port="0" to-layer="5939" to-port="0" /> + <edge from-layer="5939" from-port="1" to-layer="5942" to-port="0" /> + <edge from-layer="5940" from-port="0" to-layer="5941" to-port="0" /> + <edge from-layer="5941" from-port="1" to-layer="5942" to-port="1" /> + <edge from-layer="5942" from-port="2" to-layer="5944" to-port="0" /> + <edge from-layer="5943" from-port="0" to-layer="5944" to-port="1" /> + <edge from-layer="5944" from-port="2" to-layer="5945" to-port="0" /> + <edge from-layer="5945" from-port="1" to-layer="5946" to-port="1" /> + <edge from-layer="5946" from-port="2" to-layer="5948" to-port="0" /> + <edge from-layer="5947" from-port="0" to-layer="5948" to-port="1" /> + <edge from-layer="5948" from-port="2" to-layer="5949" to-port="0" /> + <edge from-layer="5949" from-port="1" to-layer="5958" to-port="0" /> + <edge from-layer="5950" from-port="0" to-layer="5951" to-port="0" /> + <edge from-layer="5951" from-port="1" to-layer="5954" to-port="0" /> + <edge from-layer="5952" from-port="0" to-layer="5953" to-port="0" /> + <edge from-layer="5953" from-port="1" to-layer="5954" to-port="1" /> + <edge from-layer="5954" from-port="2" to-layer="5956" to-port="0" /> + <edge from-layer="5955" from-port="0" to-layer="5956" to-port="1" /> + <edge from-layer="5956" from-port="2" to-layer="5957" to-port="0" /> + <edge from-layer="5957" from-port="1" to-layer="5958" to-port="1" /> + <edge from-layer="5958" from-port="2" to-layer="5960" to-port="0" /> + <edge from-layer="5959" from-port="0" to-layer="5960" to-port="1" /> + <edge from-layer="5960" from-port="2" to-layer="5961" to-port="0" /> + <edge from-layer="5961" from-port="2" to-layer="6158" to-port="1" /> + <edge from-layer="5961" from-port="2" to-layer="5963" to-port="0" /> + <edge from-layer="5962" from-port="0" to-layer="5963" to-port="1" /> + <edge from-layer="5963" from-port="2" to-layer="5965" to-port="0" /> + <edge from-layer="5964" from-port="0" to-layer="5965" to-port="1" /> + <edge from-layer="5965" from-port="2" to-layer="5967" to-port="0" /> + <edge from-layer="5966" from-port="0" to-layer="5967" to-port="1" /> + <edge from-layer="5967" from-port="2" to-layer="5976" to-port="0" /> + <edge from-layer="5968" from-port="0" to-layer="5969" to-port="0" /> + <edge from-layer="5969" from-port="1" to-layer="5972" to-port="0" /> + <edge from-layer="5970" from-port="0" to-layer="5971" to-port="0" /> + <edge from-layer="5971" from-port="1" to-layer="5972" to-port="1" /> + <edge from-layer="5972" from-port="2" to-layer="5974" to-port="0" /> + <edge from-layer="5973" from-port="0" to-layer="5974" to-port="1" /> + <edge from-layer="5974" from-port="2" to-layer="5975" to-port="0" /> + <edge from-layer="5975" from-port="1" to-layer="5976" to-port="1" /> + <edge from-layer="5976" from-port="2" to-layer="5978" to-port="0" /> + <edge from-layer="5977" from-port="0" to-layer="5978" to-port="1" /> + <edge from-layer="5978" from-port="2" to-layer="5980" to-port="0" /> + <edge from-layer="5979" from-port="0" to-layer="5980" to-port="1" /> + <edge from-layer="5980" from-port="2" to-layer="6094" to-port="0" /> + <edge from-layer="5980" from-port="2" to-layer="5996" to-port="0" /> + <edge from-layer="5980" from-port="2" to-layer="5984" to-port="0" /> + <edge from-layer="5981" from-port="0" to-layer="5984" to-port="1" /> + <edge from-layer="5982" from-port="0" to-layer="5984" to-port="2" /> + <edge from-layer="5983" from-port="0" to-layer="5984" to-port="3" /> + <edge from-layer="5984" from-port="4" to-layer="5986" to-port="0" /> + <edge from-layer="5985" from-port="0" to-layer="5986" to-port="1" /> + <edge from-layer="5986" from-port="2" to-layer="5990" to-port="0" /> + <edge from-layer="5987" from-port="0" to-layer="5990" to-port="1" /> + <edge from-layer="5988" from-port="0" to-layer="5990" to-port="2" /> + <edge from-layer="5989" from-port="0" to-layer="5990" to-port="3" /> + <edge from-layer="5990" from-port="4" to-layer="6036" to-port="0" /> + <edge from-layer="5990" from-port="4" to-layer="6022" to-port="0" /> + <edge from-layer="5990" from-port="4" to-layer="6025" to-port="0" /> + <edge from-layer="5990" from-port="4" to-layer="6041" to-port="0" /> + <edge from-layer="5991" from-port="0" to-layer="6018" to-port="0" /> + <edge from-layer="5992" from-port="0" to-layer="6018" to-port="1" /> + <edge from-layer="5993" from-port="0" to-layer="5996" to-port="1" /> + <edge from-layer="5994" from-port="0" to-layer="5996" to-port="2" /> + <edge from-layer="5995" from-port="0" to-layer="5996" to-port="3" /> + <edge from-layer="5996" from-port="4" to-layer="5997" to-port="0" /> + <edge from-layer="5996" from-port="4" to-layer="6053" to-port="0" /> + <edge from-layer="5997" from-port="1" to-layer="6000" to-port="0" /> + <edge from-layer="5998" from-port="0" to-layer="6000" to-port="1" /> + <edge from-layer="5999" from-port="0" to-layer="6000" to-port="2" /> + <edge from-layer="6000" from-port="3" to-layer="6016" to-port="0" /> + <edge from-layer="6001" from-port="0" to-layer="6006" to-port="0" /> + <edge from-layer="6002" from-port="0" to-layer="6005" to-port="1" /> + <edge from-layer="6003" from-port="0" to-layer="6005" to-port="2" /> + <edge from-layer="6004" from-port="0" to-layer="6005" to-port="3" /> + <edge from-layer="6005" from-port="4" to-layer="6006" to-port="1" /> + <edge from-layer="6006" from-port="2" to-layer="6007" to-port="0" /> + <edge from-layer="6007" from-port="1" to-layer="6009" to-port="0" /> + <edge from-layer="6008" from-port="0" to-layer="6009" to-port="2" /> + <edge from-layer="6009" from-port="3" to-layer="6010" to-port="0" /> + <edge from-layer="6009" from-port="3" to-layer="6081" to-port="0" /> + <edge from-layer="6010" from-port="1" to-layer="6013" to-port="0" /> + <edge from-layer="6011" from-port="0" to-layer="6013" to-port="1" /> + <edge from-layer="6012" from-port="0" to-layer="6013" to-port="2" /> + <edge from-layer="6013" from-port="3" to-layer="6015" to-port="0" /> + <edge from-layer="6013" from-port="3" to-layer="6105" to-port="0" /> + <edge from-layer="6014" from-port="0" to-layer="6015" to-port="1" /> + <edge from-layer="6015" from-port="2" to-layer="6016" to-port="1" /> + <edge from-layer="6016" from-port="2" to-layer="6018" to-port="2" /> + <edge from-layer="6016" from-port="2" to-layer="6046" to-port="2" /> + <edge from-layer="6017" from-port="0" to-layer="6018" to-port="3" /> + <edge from-layer="6018" from-port="4" to-layer="6020" to-port="0" /> + <edge from-layer="6019" from-port="0" to-layer="6020" to-port="2" /> + <edge from-layer="6020" from-port="3" to-layer="6021" to-port="0" /> + <edge from-layer="6021" from-port="2" to-layer="6022" to-port="1" /> + <edge from-layer="6021" from-port="2" to-layer="6058" to-port="1" /> + <edge from-layer="6022" from-port="2" to-layer="6051" to-port="0" /> + <edge from-layer="6023" from-port="0" to-layer="6033" to-port="0" /> + <edge from-layer="6024" from-port="0" to-layer="6033" to-port="1" /> + <edge from-layer="6025" from-port="1" to-layer="6027" to-port="0" /> + <edge from-layer="6026" from-port="0" to-layer="6027" to-port="2" /> + <edge from-layer="6027" from-port="3" to-layer="6028" to-port="0" /> + <edge from-layer="6028" from-port="2" to-layer="6029" to-port="0" /> + <edge from-layer="6029" from-port="1" to-layer="6031" to-port="0" /> + <edge from-layer="6030" from-port="0" to-layer="6031" to-port="1" /> + <edge from-layer="6031" from-port="2" to-layer="6033" to-port="2" /> + <edge from-layer="6032" from-port="0" to-layer="6033" to-port="3" /> + <edge from-layer="6033" from-port="4" to-layer="6041" to-port="2" /> + <edge from-layer="6033" from-port="4" to-layer="6036" to-port="1" /> + <edge from-layer="6034" from-port="0" to-layer="6036" to-port="2" /> + <edge from-layer="6035" from-port="0" to-layer="6036" to-port="3" /> + <edge from-layer="6036" from-port="4" to-layer="6038" to-port="0" /> + <edge from-layer="6037" from-port="0" to-layer="6038" to-port="1" /> + <edge from-layer="6038" from-port="2" to-layer="6042" to-port="0" /> + <edge from-layer="6039" from-port="0" to-layer="6041" to-port="1" /> + <edge from-layer="6040" from-port="0" to-layer="6041" to-port="3" /> + <edge from-layer="6041" from-port="4" to-layer="6042" to-port="1" /> + <edge from-layer="6042" from-port="2" to-layer="6050" to-port="0" /> + <edge from-layer="6043" from-port="0" to-layer="6046" to-port="0" /> + <edge from-layer="6044" from-port="0" to-layer="6046" to-port="1" /> + <edge from-layer="6045" from-port="0" to-layer="6046" to-port="3" /> + <edge from-layer="6046" from-port="4" to-layer="6048" to-port="0" /> + <edge from-layer="6047" from-port="0" to-layer="6048" to-port="2" /> + <edge from-layer="6048" from-port="3" to-layer="6049" to-port="0" /> + <edge from-layer="6049" from-port="2" to-layer="6050" to-port="1" /> + <edge from-layer="6049" from-port="2" to-layer="6079" to-port="1" /> + <edge from-layer="6050" from-port="2" to-layer="6051" to-port="1" /> + <edge from-layer="6051" from-port="2" to-layer="6142" to-port="0" /> + <edge from-layer="6051" from-port="2" to-layer="6106" to-port="0" /> + <edge from-layer="6052" from-port="0" to-layer="6053" to-port="1" /> + <edge from-layer="6053" from-port="2" to-layer="6057" to-port="0" /> + <edge from-layer="6054" from-port="0" to-layer="6057" to-port="1" /> + <edge from-layer="6055" from-port="0" to-layer="6057" to-port="2" /> + <edge from-layer="6056" from-port="0" to-layer="6057" to-port="3" /> + <edge from-layer="6057" from-port="4" to-layer="6077" to-port="0" /> + <edge from-layer="6057" from-port="4" to-layer="6072" to-port="0" /> + <edge from-layer="6057" from-port="4" to-layer="6058" to-port="0" /> + <edge from-layer="6057" from-port="4" to-layer="6061" to-port="0" /> + <edge from-layer="6058" from-port="2" to-layer="6080" to-port="0" /> + <edge from-layer="6059" from-port="0" to-layer="6069" to-port="0" /> + <edge from-layer="6060" from-port="0" to-layer="6069" to-port="1" /> + <edge from-layer="6061" from-port="1" to-layer="6063" to-port="0" /> + <edge from-layer="6062" from-port="0" to-layer="6063" to-port="2" /> + <edge from-layer="6063" from-port="3" to-layer="6064" to-port="0" /> + <edge from-layer="6064" from-port="2" to-layer="6065" to-port="0" /> + <edge from-layer="6065" from-port="1" to-layer="6067" to-port="0" /> + <edge from-layer="6066" from-port="0" to-layer="6067" to-port="1" /> + <edge from-layer="6067" from-port="2" to-layer="6069" to-port="2" /> + <edge from-layer="6068" from-port="0" to-layer="6069" to-port="3" /> + <edge from-layer="6069" from-port="4" to-layer="6072" to-port="1" /> + <edge from-layer="6069" from-port="4" to-layer="6077" to-port="2" /> + <edge from-layer="6070" from-port="0" to-layer="6072" to-port="2" /> + <edge from-layer="6071" from-port="0" to-layer="6072" to-port="3" /> + <edge from-layer="6072" from-port="4" to-layer="6074" to-port="0" /> + <edge from-layer="6073" from-port="0" to-layer="6074" to-port="1" /> + <edge from-layer="6074" from-port="2" to-layer="6078" to-port="0" /> + <edge from-layer="6075" from-port="0" to-layer="6077" to-port="1" /> + <edge from-layer="6076" from-port="0" to-layer="6077" to-port="3" /> + <edge from-layer="6077" from-port="4" to-layer="6078" to-port="1" /> + <edge from-layer="6078" from-port="2" to-layer="6079" to-port="0" /> + <edge from-layer="6079" from-port="2" to-layer="6080" to-port="1" /> + <edge from-layer="6080" from-port="2" to-layer="6081" to-port="1" /> + <edge from-layer="6080" from-port="2" to-layer="6101" to-port="0" /> + <edge from-layer="6081" from-port="2" to-layer="7202" to-port="0" /> + <edge from-layer="6081" from-port="2" to-layer="6142" to-port="1" /> + <edge from-layer="6082" from-port="0" to-layer="6087" to-port="0" /> + <edge from-layer="6083" from-port="0" to-layer="6086" to-port="1" /> + <edge from-layer="6084" from-port="0" to-layer="6086" to-port="2" /> + <edge from-layer="6085" from-port="0" to-layer="6086" to-port="3" /> + <edge from-layer="6086" from-port="4" to-layer="6087" to-port="1" /> + <edge from-layer="6087" from-port="2" to-layer="6088" to-port="0" /> + <edge from-layer="6088" from-port="1" to-layer="6090" to-port="0" /> + <edge from-layer="6089" from-port="0" to-layer="6090" to-port="2" /> + <edge from-layer="6090" from-port="3" to-layer="6097" to-port="0" /> + <edge from-layer="6091" from-port="0" to-layer="6094" to-port="1" /> + <edge from-layer="6092" from-port="0" to-layer="6094" to-port="2" /> + <edge from-layer="6093" from-port="0" to-layer="6094" to-port="3" /> + <edge from-layer="6094" from-port="4" to-layer="6096" to-port="0" /> + <edge from-layer="6095" from-port="0" to-layer="6096" to-port="1" /> + <edge from-layer="6096" from-port="2" to-layer="6097" to-port="1" /> + <edge from-layer="6097" from-port="2" to-layer="6142" to-port="2" /> + <edge from-layer="6097" from-port="2" to-layer="7201" to-port="0" /> + <edge from-layer="6098" from-port="0" to-layer="6120" to-port="0" /> + <edge from-layer="6099" from-port="0" to-layer="6114" to-port="0" /> + <edge from-layer="6100" from-port="0" to-layer="6114" to-port="1" /> + <edge from-layer="6100" from-port="0" to-layer="6118" to-port="1" /> + <edge from-layer="6101" from-port="1" to-layer="6104" to-port="0" /> + <edge from-layer="6102" from-port="0" to-layer="6104" to-port="1" /> + <edge from-layer="6103" from-port="0" to-layer="6104" to-port="2" /> + <edge from-layer="6104" from-port="3" to-layer="6105" to-port="1" /> + <edge from-layer="6105" from-port="2" to-layer="6110" to-port="0" /> + <edge from-layer="6105" from-port="2" to-layer="6117" to-port="0" /> + <edge from-layer="6106" from-port="1" to-layer="6109" to-port="0" /> + <edge from-layer="6106" from-port="1" to-layer="6135" to-port="0" /> + <edge from-layer="6107" from-port="0" to-layer="6109" to-port="1" /> + <edge from-layer="6108" from-port="0" to-layer="6109" to-port="2" /> + <edge from-layer="6109" from-port="3" to-layer="6110" to-port="1" /> + <edge from-layer="6110" from-port="2" to-layer="6112" to-port="0" /> + <edge from-layer="6111" from-port="0" to-layer="6112" to-port="1" /> + <edge from-layer="6112" from-port="2" to-layer="6114" to-port="2" /> + <edge from-layer="6113" from-port="0" to-layer="6114" to-port="3" /> + <edge from-layer="6113" from-port="0" to-layer="6118" to-port="3" /> + <edge from-layer="6114" from-port="4" to-layer="6120" to-port="1" /> + <edge from-layer="6115" from-port="0" to-layer="6118" to-port="0" /> + <edge from-layer="6116" from-port="0" to-layer="6117" to-port="1" /> + <edge from-layer="6117" from-port="2" to-layer="6125" to-port="2" /> + <edge from-layer="6117" from-port="2" to-layer="6118" to-port="2" /> + <edge from-layer="6118" from-port="4" to-layer="6120" to-port="2" /> + <edge from-layer="6119" from-port="0" to-layer="6120" to-port="3" /> + <edge from-layer="6120" from-port="4" to-layer="6127" to-port="0" /> + <edge from-layer="6121" from-port="0" to-layer="6127" to-port="1" /> + <edge from-layer="6122" from-port="0" to-layer="6125" to-port="0" /> + <edge from-layer="6123" from-port="0" to-layer="6125" to-port="1" /> + <edge from-layer="6124" from-port="0" to-layer="6125" to-port="3" /> + <edge from-layer="6125" from-port="4" to-layer="6127" to-port="2" /> + <edge from-layer="6126" from-port="0" to-layer="6127" to-port="3" /> + <edge from-layer="6127" from-port="4" to-layer="6130" to-port="0" /> + <edge from-layer="6128" from-port="0" to-layer="6130" to-port="1" /> + <edge from-layer="6129" from-port="0" to-layer="6130" to-port="2" /> + <edge from-layer="6130" from-port="3" to-layer="6131" to-port="0" /> + <edge from-layer="6131" from-port="2" to-layer="6141" to-port="0" /> + <edge from-layer="6131" from-port="2" to-layer="6132" to-port="0" /> + <edge from-layer="6132" from-port="1" to-layer="6140" to-port="0" /> + <edge from-layer="6133" from-port="0" to-layer="6135" to-port="1" /> + <edge from-layer="6134" from-port="0" to-layer="6135" to-port="2" /> + <edge from-layer="6135" from-port="3" to-layer="6139" to-port="0" /> + <edge from-layer="6136" from-port="0" to-layer="6139" to-port="1" /> + <edge from-layer="6137" from-port="0" to-layer="6139" to-port="2" /> + <edge from-layer="6138" from-port="0" to-layer="6139" to-port="3" /> + <edge from-layer="6139" from-port="4" to-layer="6140" to-port="1" /> + <edge from-layer="6140" from-port="2" to-layer="6141" to-port="1" /> + <edge from-layer="6141" from-port="2" to-layer="6142" to-port="3" /> + <edge from-layer="6142" from-port="4" to-layer="6144" to-port="0" /> + <edge from-layer="6143" from-port="0" to-layer="6144" to-port="1" /> + <edge from-layer="6144" from-port="2" to-layer="6146" to-port="0" /> + <edge from-layer="6145" from-port="0" to-layer="6146" to-port="1" /> + <edge from-layer="6146" from-port="2" to-layer="6155" to-port="0" /> + <edge from-layer="6147" from-port="0" to-layer="6148" to-port="0" /> + <edge from-layer="6148" from-port="1" to-layer="6151" to-port="0" /> + <edge from-layer="6149" from-port="0" to-layer="6150" to-port="0" /> + <edge from-layer="6150" from-port="1" to-layer="6151" to-port="1" /> + <edge from-layer="6151" from-port="2" to-layer="6153" to-port="0" /> + <edge from-layer="6152" from-port="0" to-layer="6153" to-port="1" /> + <edge from-layer="6153" from-port="2" to-layer="6154" to-port="0" /> + <edge from-layer="6154" from-port="1" to-layer="6155" to-port="1" /> + <edge from-layer="6155" from-port="2" to-layer="6157" to-port="0" /> + <edge from-layer="6156" from-port="0" to-layer="6157" to-port="1" /> + <edge from-layer="6157" from-port="2" to-layer="6158" to-port="0" /> + <edge from-layer="6158" from-port="2" to-layer="6160" to-port="0" /> + <edge from-layer="6158" from-port="2" to-layer="6188" to-port="1" /> + <edge from-layer="6159" from-port="0" to-layer="6160" to-port="1" /> + <edge from-layer="6160" from-port="2" to-layer="6162" to-port="0" /> + <edge from-layer="6161" from-port="0" to-layer="6162" to-port="1" /> + <edge from-layer="6162" from-port="2" to-layer="6164" to-port="0" /> + <edge from-layer="6163" from-port="0" to-layer="6164" to-port="1" /> + <edge from-layer="6164" from-port="2" to-layer="6173" to-port="0" /> + <edge from-layer="6165" from-port="0" to-layer="6166" to-port="0" /> + <edge from-layer="6166" from-port="1" to-layer="6169" to-port="0" /> + <edge from-layer="6167" from-port="0" to-layer="6168" to-port="0" /> + <edge from-layer="6168" from-port="1" to-layer="6169" to-port="1" /> + <edge from-layer="6169" from-port="2" to-layer="6171" to-port="0" /> + <edge from-layer="6170" from-port="0" to-layer="6171" to-port="1" /> + <edge from-layer="6171" from-port="2" to-layer="6172" to-port="0" /> + <edge from-layer="6172" from-port="1" to-layer="6173" to-port="1" /> + <edge from-layer="6173" from-port="2" to-layer="6175" to-port="0" /> + <edge from-layer="6174" from-port="0" to-layer="6175" to-port="1" /> + <edge from-layer="6175" from-port="2" to-layer="6176" to-port="0" /> + <edge from-layer="6176" from-port="1" to-layer="6185" to-port="0" /> + <edge from-layer="6177" from-port="0" to-layer="6178" to-port="0" /> + <edge from-layer="6178" from-port="1" to-layer="6181" to-port="0" /> + <edge from-layer="6179" from-port="0" to-layer="6180" to-port="0" /> + <edge from-layer="6180" from-port="1" to-layer="6181" to-port="1" /> + <edge from-layer="6181" from-port="2" to-layer="6183" to-port="0" /> + <edge from-layer="6182" from-port="0" to-layer="6183" to-port="1" /> + <edge from-layer="6183" from-port="2" to-layer="6184" to-port="0" /> + <edge from-layer="6184" from-port="1" to-layer="6185" to-port="1" /> + <edge from-layer="6185" from-port="2" to-layer="6187" to-port="0" /> + <edge from-layer="6186" from-port="0" to-layer="6187" to-port="1" /> + <edge from-layer="6187" from-port="2" to-layer="6188" to-port="0" /> + <edge from-layer="6188" from-port="2" to-layer="6385" to-port="1" /> + <edge from-layer="6188" from-port="2" to-layer="6190" to-port="0" /> + <edge from-layer="6189" from-port="0" to-layer="6190" to-port="1" /> + <edge from-layer="6190" from-port="2" to-layer="6192" to-port="0" /> + <edge from-layer="6191" from-port="0" to-layer="6192" to-port="1" /> + <edge from-layer="6192" from-port="2" to-layer="6194" to-port="0" /> + <edge from-layer="6193" from-port="0" to-layer="6194" to-port="1" /> + <edge from-layer="6194" from-port="2" to-layer="6203" to-port="0" /> + <edge from-layer="6195" from-port="0" to-layer="6196" to-port="0" /> + <edge from-layer="6196" from-port="1" to-layer="6199" to-port="0" /> + <edge from-layer="6197" from-port="0" to-layer="6198" to-port="0" /> + <edge from-layer="6198" from-port="1" to-layer="6199" to-port="1" /> + <edge from-layer="6199" from-port="2" to-layer="6201" to-port="0" /> + <edge from-layer="6200" from-port="0" to-layer="6201" to-port="1" /> + <edge from-layer="6201" from-port="2" to-layer="6202" to-port="0" /> + <edge from-layer="6202" from-port="1" to-layer="6203" to-port="1" /> + <edge from-layer="6203" from-port="2" to-layer="6205" to-port="0" /> + <edge from-layer="6204" from-port="0" to-layer="6205" to-port="1" /> + <edge from-layer="6205" from-port="2" to-layer="6207" to-port="0" /> + <edge from-layer="6206" from-port="0" to-layer="6207" to-port="1" /> + <edge from-layer="6207" from-port="2" to-layer="6223" to-port="0" /> + <edge from-layer="6207" from-port="2" to-layer="6211" to-port="0" /> + <edge from-layer="6207" from-port="2" to-layer="6321" to-port="0" /> + <edge from-layer="6208" from-port="0" to-layer="6211" to-port="1" /> + <edge from-layer="6209" from-port="0" to-layer="6211" to-port="2" /> + <edge from-layer="6210" from-port="0" to-layer="6211" to-port="3" /> + <edge from-layer="6211" from-port="4" to-layer="6213" to-port="0" /> + <edge from-layer="6212" from-port="0" to-layer="6213" to-port="1" /> + <edge from-layer="6213" from-port="2" to-layer="6217" to-port="0" /> + <edge from-layer="6214" from-port="0" to-layer="6217" to-port="1" /> + <edge from-layer="6215" from-port="0" to-layer="6217" to-port="2" /> + <edge from-layer="6216" from-port="0" to-layer="6217" to-port="3" /> + <edge from-layer="6217" from-port="4" to-layer="6263" to-port="0" /> + <edge from-layer="6217" from-port="4" to-layer="6249" to-port="0" /> + <edge from-layer="6217" from-port="4" to-layer="6252" to-port="0" /> + <edge from-layer="6217" from-port="4" to-layer="6268" to-port="0" /> + <edge from-layer="6218" from-port="0" to-layer="6245" to-port="0" /> + <edge from-layer="6219" from-port="0" to-layer="6245" to-port="1" /> + <edge from-layer="6220" from-port="0" to-layer="6223" to-port="1" /> + <edge from-layer="6221" from-port="0" to-layer="6223" to-port="2" /> + <edge from-layer="6222" from-port="0" to-layer="6223" to-port="3" /> + <edge from-layer="6223" from-port="4" to-layer="6280" to-port="0" /> + <edge from-layer="6223" from-port="4" to-layer="6224" to-port="0" /> + <edge from-layer="6224" from-port="1" to-layer="6227" to-port="0" /> + <edge from-layer="6225" from-port="0" to-layer="6227" to-port="1" /> + <edge from-layer="6226" from-port="0" to-layer="6227" to-port="2" /> + <edge from-layer="6227" from-port="3" to-layer="6243" to-port="0" /> + <edge from-layer="6228" from-port="0" to-layer="6233" to-port="0" /> + <edge from-layer="6229" from-port="0" to-layer="6232" to-port="1" /> + <edge from-layer="6230" from-port="0" to-layer="6232" to-port="2" /> + <edge from-layer="6231" from-port="0" to-layer="6232" to-port="3" /> + <edge from-layer="6232" from-port="4" to-layer="6233" to-port="1" /> + <edge from-layer="6233" from-port="2" to-layer="6234" to-port="0" /> + <edge from-layer="6234" from-port="1" to-layer="6236" to-port="0" /> + <edge from-layer="6235" from-port="0" to-layer="6236" to-port="2" /> + <edge from-layer="6236" from-port="3" to-layer="6308" to-port="0" /> + <edge from-layer="6236" from-port="3" to-layer="6237" to-port="0" /> + <edge from-layer="6237" from-port="1" to-layer="6240" to-port="0" /> + <edge from-layer="6238" from-port="0" to-layer="6240" to-port="1" /> + <edge from-layer="6239" from-port="0" to-layer="6240" to-port="2" /> + <edge from-layer="6240" from-port="3" to-layer="6242" to-port="0" /> + <edge from-layer="6240" from-port="3" to-layer="6332" to-port="0" /> + <edge from-layer="6241" from-port="0" to-layer="6242" to-port="1" /> + <edge from-layer="6242" from-port="2" to-layer="6243" to-port="1" /> + <edge from-layer="6243" from-port="2" to-layer="6245" to-port="2" /> + <edge from-layer="6243" from-port="2" to-layer="6273" to-port="2" /> + <edge from-layer="6244" from-port="0" to-layer="6245" to-port="3" /> + <edge from-layer="6245" from-port="4" to-layer="6247" to-port="0" /> + <edge from-layer="6246" from-port="0" to-layer="6247" to-port="2" /> + <edge from-layer="6247" from-port="3" to-layer="6248" to-port="0" /> + <edge from-layer="6248" from-port="2" to-layer="6249" to-port="1" /> + <edge from-layer="6248" from-port="2" to-layer="6285" to-port="1" /> + <edge from-layer="6249" from-port="2" to-layer="6278" to-port="0" /> + <edge from-layer="6250" from-port="0" to-layer="6260" to-port="0" /> + <edge from-layer="6251" from-port="0" to-layer="6260" to-port="1" /> + <edge from-layer="6252" from-port="1" to-layer="6254" to-port="0" /> + <edge from-layer="6253" from-port="0" to-layer="6254" to-port="2" /> + <edge from-layer="6254" from-port="3" to-layer="6255" to-port="0" /> + <edge from-layer="6255" from-port="2" to-layer="6256" to-port="0" /> + <edge from-layer="6256" from-port="1" to-layer="6258" to-port="0" /> + <edge from-layer="6257" from-port="0" to-layer="6258" to-port="1" /> + <edge from-layer="6258" from-port="2" to-layer="6260" to-port="2" /> + <edge from-layer="6259" from-port="0" to-layer="6260" to-port="3" /> + <edge from-layer="6260" from-port="4" to-layer="6263" to-port="1" /> + <edge from-layer="6260" from-port="4" to-layer="6268" to-port="2" /> + <edge from-layer="6261" from-port="0" to-layer="6263" to-port="2" /> + <edge from-layer="6262" from-port="0" to-layer="6263" to-port="3" /> + <edge from-layer="6263" from-port="4" to-layer="6265" to-port="0" /> + <edge from-layer="6264" from-port="0" to-layer="6265" to-port="1" /> + <edge from-layer="6265" from-port="2" to-layer="6269" to-port="0" /> + <edge from-layer="6266" from-port="0" to-layer="6268" to-port="1" /> + <edge from-layer="6267" from-port="0" to-layer="6268" to-port="3" /> + <edge from-layer="6268" from-port="4" to-layer="6269" to-port="1" /> + <edge from-layer="6269" from-port="2" to-layer="6277" to-port="0" /> + <edge from-layer="6270" from-port="0" to-layer="6273" to-port="0" /> + <edge from-layer="6271" from-port="0" to-layer="6273" to-port="1" /> + <edge from-layer="6272" from-port="0" to-layer="6273" to-port="3" /> + <edge from-layer="6273" from-port="4" to-layer="6275" to-port="0" /> + <edge from-layer="6274" from-port="0" to-layer="6275" to-port="2" /> + <edge from-layer="6275" from-port="3" to-layer="6276" to-port="0" /> + <edge from-layer="6276" from-port="2" to-layer="6277" to-port="1" /> + <edge from-layer="6276" from-port="2" to-layer="6306" to-port="1" /> + <edge from-layer="6277" from-port="2" to-layer="6278" to-port="1" /> + <edge from-layer="6278" from-port="2" to-layer="6333" to-port="0" /> + <edge from-layer="6278" from-port="2" to-layer="6369" to-port="0" /> + <edge from-layer="6279" from-port="0" to-layer="6280" to-port="1" /> + <edge from-layer="6280" from-port="2" to-layer="6284" to-port="0" /> + <edge from-layer="6281" from-port="0" to-layer="6284" to-port="1" /> + <edge from-layer="6282" from-port="0" to-layer="6284" to-port="2" /> + <edge from-layer="6283" from-port="0" to-layer="6284" to-port="3" /> + <edge from-layer="6284" from-port="4" to-layer="6304" to-port="0" /> + <edge from-layer="6284" from-port="4" to-layer="6299" to-port="0" /> + <edge from-layer="6284" from-port="4" to-layer="6288" to-port="0" /> + <edge from-layer="6284" from-port="4" to-layer="6285" to-port="0" /> + <edge from-layer="6285" from-port="2" to-layer="6307" to-port="0" /> + <edge from-layer="6286" from-port="0" to-layer="6296" to-port="0" /> + <edge from-layer="6287" from-port="0" to-layer="6296" to-port="1" /> + <edge from-layer="6288" from-port="1" to-layer="6290" to-port="0" /> + <edge from-layer="6289" from-port="0" to-layer="6290" to-port="2" /> + <edge from-layer="6290" from-port="3" to-layer="6291" to-port="0" /> + <edge from-layer="6291" from-port="2" to-layer="6292" to-port="0" /> + <edge from-layer="6292" from-port="1" to-layer="6294" to-port="0" /> + <edge from-layer="6293" from-port="0" to-layer="6294" to-port="1" /> + <edge from-layer="6294" from-port="2" to-layer="6296" to-port="2" /> + <edge from-layer="6295" from-port="0" to-layer="6296" to-port="3" /> + <edge from-layer="6296" from-port="4" to-layer="6304" to-port="2" /> + <edge from-layer="6296" from-port="4" to-layer="6299" to-port="1" /> + <edge from-layer="6297" from-port="0" to-layer="6299" to-port="2" /> + <edge from-layer="6298" from-port="0" to-layer="6299" to-port="3" /> + <edge from-layer="6299" from-port="4" to-layer="6301" to-port="0" /> + <edge from-layer="6300" from-port="0" to-layer="6301" to-port="1" /> + <edge from-layer="6301" from-port="2" to-layer="6305" to-port="0" /> + <edge from-layer="6302" from-port="0" to-layer="6304" to-port="1" /> + <edge from-layer="6303" from-port="0" to-layer="6304" to-port="3" /> + <edge from-layer="6304" from-port="4" to-layer="6305" to-port="1" /> + <edge from-layer="6305" from-port="2" to-layer="6306" to-port="0" /> + <edge from-layer="6306" from-port="2" to-layer="6307" to-port="1" /> + <edge from-layer="6307" from-port="2" to-layer="6328" to-port="0" /> + <edge from-layer="6307" from-port="2" to-layer="6308" to-port="1" /> + <edge from-layer="6308" from-port="2" to-layer="7200" to-port="0" /> + <edge from-layer="6308" from-port="2" to-layer="6369" to-port="1" /> + <edge from-layer="6309" from-port="0" to-layer="6314" to-port="0" /> + <edge from-layer="6310" from-port="0" to-layer="6313" to-port="1" /> + <edge from-layer="6311" from-port="0" to-layer="6313" to-port="2" /> + <edge from-layer="6312" from-port="0" to-layer="6313" to-port="3" /> + <edge from-layer="6313" from-port="4" to-layer="6314" to-port="1" /> + <edge from-layer="6314" from-port="2" to-layer="6315" to-port="0" /> + <edge from-layer="6315" from-port="1" to-layer="6317" to-port="0" /> + <edge from-layer="6316" from-port="0" to-layer="6317" to-port="2" /> + <edge from-layer="6317" from-port="3" to-layer="6324" to-port="0" /> + <edge from-layer="6318" from-port="0" to-layer="6321" to-port="1" /> + <edge from-layer="6319" from-port="0" to-layer="6321" to-port="2" /> + <edge from-layer="6320" from-port="0" to-layer="6321" to-port="3" /> + <edge from-layer="6321" from-port="4" to-layer="6323" to-port="0" /> + <edge from-layer="6322" from-port="0" to-layer="6323" to-port="1" /> + <edge from-layer="6323" from-port="2" to-layer="6324" to-port="1" /> + <edge from-layer="6324" from-port="2" to-layer="6369" to-port="2" /> + <edge from-layer="6324" from-port="2" to-layer="7199" to-port="0" /> + <edge from-layer="6325" from-port="0" to-layer="6347" to-port="0" /> + <edge from-layer="6326" from-port="0" to-layer="6341" to-port="0" /> + <edge from-layer="6327" from-port="0" to-layer="6345" to-port="1" /> + <edge from-layer="6327" from-port="0" to-layer="6341" to-port="1" /> + <edge from-layer="6328" from-port="1" to-layer="6331" to-port="0" /> + <edge from-layer="6329" from-port="0" to-layer="6331" to-port="1" /> + <edge from-layer="6330" from-port="0" to-layer="6331" to-port="2" /> + <edge from-layer="6331" from-port="3" to-layer="6332" to-port="1" /> + <edge from-layer="6332" from-port="2" to-layer="6337" to-port="0" /> + <edge from-layer="6332" from-port="2" to-layer="6344" to-port="0" /> + <edge from-layer="6333" from-port="1" to-layer="6336" to-port="0" /> + <edge from-layer="6333" from-port="1" to-layer="6362" to-port="0" /> + <edge from-layer="6334" from-port="0" to-layer="6336" to-port="1" /> + <edge from-layer="6335" from-port="0" to-layer="6336" to-port="2" /> + <edge from-layer="6336" from-port="3" to-layer="6337" to-port="1" /> + <edge from-layer="6337" from-port="2" to-layer="6339" to-port="0" /> + <edge from-layer="6338" from-port="0" to-layer="6339" to-port="1" /> + <edge from-layer="6339" from-port="2" to-layer="6341" to-port="2" /> + <edge from-layer="6340" from-port="0" to-layer="6341" to-port="3" /> + <edge from-layer="6340" from-port="0" to-layer="6345" to-port="3" /> + <edge from-layer="6341" from-port="4" to-layer="6347" to-port="1" /> + <edge from-layer="6342" from-port="0" to-layer="6345" to-port="0" /> + <edge from-layer="6343" from-port="0" to-layer="6344" to-port="1" /> + <edge from-layer="6344" from-port="2" to-layer="6345" to-port="2" /> + <edge from-layer="6344" from-port="2" to-layer="6352" to-port="2" /> + <edge from-layer="6345" from-port="4" to-layer="6347" to-port="2" /> + <edge from-layer="6346" from-port="0" to-layer="6347" to-port="3" /> + <edge from-layer="6347" from-port="4" to-layer="6354" to-port="0" /> + <edge from-layer="6348" from-port="0" to-layer="6354" to-port="1" /> + <edge from-layer="6349" from-port="0" to-layer="6352" to-port="0" /> + <edge from-layer="6350" from-port="0" to-layer="6352" to-port="1" /> + <edge from-layer="6351" from-port="0" to-layer="6352" to-port="3" /> + <edge from-layer="6352" from-port="4" to-layer="6354" to-port="2" /> + <edge from-layer="6353" from-port="0" to-layer="6354" to-port="3" /> + <edge from-layer="6354" from-port="4" to-layer="6357" to-port="0" /> + <edge from-layer="6355" from-port="0" to-layer="6357" to-port="1" /> + <edge from-layer="6356" from-port="0" to-layer="6357" to-port="2" /> + <edge from-layer="6357" from-port="3" to-layer="6358" to-port="0" /> + <edge from-layer="6358" from-port="2" to-layer="6359" to-port="0" /> + <edge from-layer="6358" from-port="2" to-layer="6368" to-port="0" /> + <edge from-layer="6359" from-port="1" to-layer="6367" to-port="0" /> + <edge from-layer="6360" from-port="0" to-layer="6362" to-port="1" /> + <edge from-layer="6361" from-port="0" to-layer="6362" to-port="2" /> + <edge from-layer="6362" from-port="3" to-layer="6366" to-port="0" /> + <edge from-layer="6363" from-port="0" to-layer="6366" to-port="1" /> + <edge from-layer="6364" from-port="0" to-layer="6366" to-port="2" /> + <edge from-layer="6365" from-port="0" to-layer="6366" to-port="3" /> + <edge from-layer="6366" from-port="4" to-layer="6367" to-port="1" /> + <edge from-layer="6367" from-port="2" to-layer="6368" to-port="1" /> + <edge from-layer="6368" from-port="2" to-layer="6369" to-port="3" /> + <edge from-layer="6369" from-port="4" to-layer="6371" to-port="0" /> + <edge from-layer="6370" from-port="0" to-layer="6371" to-port="1" /> + <edge from-layer="6371" from-port="2" to-layer="6373" to-port="0" /> + <edge from-layer="6372" from-port="0" to-layer="6373" to-port="1" /> + <edge from-layer="6373" from-port="2" to-layer="6382" to-port="0" /> + <edge from-layer="6374" from-port="0" to-layer="6375" to-port="0" /> + <edge from-layer="6375" from-port="1" to-layer="6378" to-port="0" /> + <edge from-layer="6376" from-port="0" to-layer="6377" to-port="0" /> + <edge from-layer="6377" from-port="1" to-layer="6378" to-port="1" /> + <edge from-layer="6378" from-port="2" to-layer="6380" to-port="0" /> + <edge from-layer="6379" from-port="0" to-layer="6380" to-port="1" /> + <edge from-layer="6380" from-port="2" to-layer="6381" to-port="0" /> + <edge from-layer="6381" from-port="1" to-layer="6382" to-port="1" /> + <edge from-layer="6382" from-port="2" to-layer="6384" to-port="0" /> + <edge from-layer="6383" from-port="0" to-layer="6384" to-port="1" /> + <edge from-layer="6384" from-port="2" to-layer="6385" to-port="0" /> + <edge from-layer="6385" from-port="2" to-layer="6415" to-port="1" /> + <edge from-layer="6385" from-port="2" to-layer="6387" to-port="0" /> + <edge from-layer="6386" from-port="0" to-layer="6387" to-port="1" /> + <edge from-layer="6387" from-port="2" to-layer="6389" to-port="0" /> + <edge from-layer="6388" from-port="0" to-layer="6389" to-port="1" /> + <edge from-layer="6389" from-port="2" to-layer="6391" to-port="0" /> + <edge from-layer="6390" from-port="0" to-layer="6391" to-port="1" /> + <edge from-layer="6391" from-port="2" to-layer="6400" to-port="0" /> + <edge from-layer="6392" from-port="0" to-layer="6393" to-port="0" /> + <edge from-layer="6393" from-port="1" to-layer="6396" to-port="0" /> + <edge from-layer="6394" from-port="0" to-layer="6395" to-port="0" /> + <edge from-layer="6395" from-port="1" to-layer="6396" to-port="1" /> + <edge from-layer="6396" from-port="2" to-layer="6398" to-port="0" /> + <edge from-layer="6397" from-port="0" to-layer="6398" to-port="1" /> + <edge from-layer="6398" from-port="2" to-layer="6399" to-port="0" /> + <edge from-layer="6399" from-port="1" to-layer="6400" to-port="1" /> + <edge from-layer="6400" from-port="2" to-layer="6402" to-port="0" /> + <edge from-layer="6401" from-port="0" to-layer="6402" to-port="1" /> + <edge from-layer="6402" from-port="2" to-layer="6403" to-port="0" /> + <edge from-layer="6403" from-port="1" to-layer="6412" to-port="0" /> + <edge from-layer="6404" from-port="0" to-layer="6405" to-port="0" /> + <edge from-layer="6405" from-port="1" to-layer="6408" to-port="0" /> + <edge from-layer="6406" from-port="0" to-layer="6407" to-port="0" /> + <edge from-layer="6407" from-port="1" to-layer="6408" to-port="1" /> + <edge from-layer="6408" from-port="2" to-layer="6410" to-port="0" /> + <edge from-layer="6409" from-port="0" to-layer="6410" to-port="1" /> + <edge from-layer="6410" from-port="2" to-layer="6411" to-port="0" /> + <edge from-layer="6411" from-port="1" to-layer="6412" to-port="1" /> + <edge from-layer="6412" from-port="2" to-layer="6414" to-port="0" /> + <edge from-layer="6413" from-port="0" to-layer="6414" to-port="1" /> + <edge from-layer="6414" from-port="2" to-layer="6415" to-port="0" /> + <edge from-layer="6415" from-port="2" to-layer="6417" to-port="0" /> + <edge from-layer="6415" from-port="2" to-layer="6612" to-port="1" /> + <edge from-layer="6416" from-port="0" to-layer="6417" to-port="1" /> + <edge from-layer="6417" from-port="2" to-layer="6419" to-port="0" /> + <edge from-layer="6418" from-port="0" to-layer="6419" to-port="1" /> + <edge from-layer="6419" from-port="2" to-layer="6421" to-port="0" /> + <edge from-layer="6420" from-port="0" to-layer="6421" to-port="1" /> + <edge from-layer="6421" from-port="2" to-layer="6430" to-port="0" /> + <edge from-layer="6422" from-port="0" to-layer="6423" to-port="0" /> + <edge from-layer="6423" from-port="1" to-layer="6426" to-port="0" /> + <edge from-layer="6424" from-port="0" to-layer="6425" to-port="0" /> + <edge from-layer="6425" from-port="1" to-layer="6426" to-port="1" /> + <edge from-layer="6426" from-port="2" to-layer="6428" to-port="0" /> + <edge from-layer="6427" from-port="0" to-layer="6428" to-port="1" /> + <edge from-layer="6428" from-port="2" to-layer="6429" to-port="0" /> + <edge from-layer="6429" from-port="1" to-layer="6430" to-port="1" /> + <edge from-layer="6430" from-port="2" to-layer="6432" to-port="0" /> + <edge from-layer="6431" from-port="0" to-layer="6432" to-port="1" /> + <edge from-layer="6432" from-port="2" to-layer="6434" to-port="0" /> + <edge from-layer="6433" from-port="0" to-layer="6434" to-port="1" /> + <edge from-layer="6434" from-port="2" to-layer="6548" to-port="0" /> + <edge from-layer="6434" from-port="2" to-layer="6438" to-port="0" /> + <edge from-layer="6434" from-port="2" to-layer="6450" to-port="0" /> + <edge from-layer="6435" from-port="0" to-layer="6438" to-port="1" /> + <edge from-layer="6436" from-port="0" to-layer="6438" to-port="2" /> + <edge from-layer="6437" from-port="0" to-layer="6438" to-port="3" /> + <edge from-layer="6438" from-port="4" to-layer="6440" to-port="0" /> + <edge from-layer="6439" from-port="0" to-layer="6440" to-port="1" /> + <edge from-layer="6440" from-port="2" to-layer="6444" to-port="0" /> + <edge from-layer="6441" from-port="0" to-layer="6444" to-port="1" /> + <edge from-layer="6442" from-port="0" to-layer="6444" to-port="2" /> + <edge from-layer="6443" from-port="0" to-layer="6444" to-port="3" /> + <edge from-layer="6444" from-port="4" to-layer="6490" to-port="0" /> + <edge from-layer="6444" from-port="4" to-layer="6495" to-port="0" /> + <edge from-layer="6444" from-port="4" to-layer="6476" to-port="0" /> + <edge from-layer="6444" from-port="4" to-layer="6479" to-port="0" /> + <edge from-layer="6445" from-port="0" to-layer="6472" to-port="0" /> + <edge from-layer="6446" from-port="0" to-layer="6472" to-port="1" /> + <edge from-layer="6447" from-port="0" to-layer="6450" to-port="1" /> + <edge from-layer="6448" from-port="0" to-layer="6450" to-port="2" /> + <edge from-layer="6449" from-port="0" to-layer="6450" to-port="3" /> + <edge from-layer="6450" from-port="4" to-layer="6507" to-port="0" /> + <edge from-layer="6450" from-port="4" to-layer="6451" to-port="0" /> + <edge from-layer="6451" from-port="1" to-layer="6454" to-port="0" /> + <edge from-layer="6452" from-port="0" to-layer="6454" to-port="1" /> + <edge from-layer="6453" from-port="0" to-layer="6454" to-port="2" /> + <edge from-layer="6454" from-port="3" to-layer="6470" to-port="0" /> + <edge from-layer="6455" from-port="0" to-layer="6460" to-port="0" /> + <edge from-layer="6456" from-port="0" to-layer="6459" to-port="1" /> + <edge from-layer="6457" from-port="0" to-layer="6459" to-port="2" /> + <edge from-layer="6458" from-port="0" to-layer="6459" to-port="3" /> + <edge from-layer="6459" from-port="4" to-layer="6460" to-port="1" /> + <edge from-layer="6460" from-port="2" to-layer="6461" to-port="0" /> + <edge from-layer="6461" from-port="1" to-layer="6463" to-port="0" /> + <edge from-layer="6462" from-port="0" to-layer="6463" to-port="2" /> + <edge from-layer="6463" from-port="3" to-layer="6464" to-port="0" /> + <edge from-layer="6463" from-port="3" to-layer="6535" to-port="0" /> + <edge from-layer="6464" from-port="1" to-layer="6467" to-port="0" /> + <edge from-layer="6465" from-port="0" to-layer="6467" to-port="1" /> + <edge from-layer="6466" from-port="0" to-layer="6467" to-port="2" /> + <edge from-layer="6467" from-port="3" to-layer="6469" to-port="0" /> + <edge from-layer="6467" from-port="3" to-layer="6559" to-port="0" /> + <edge from-layer="6468" from-port="0" to-layer="6469" to-port="1" /> + <edge from-layer="6469" from-port="2" to-layer="6470" to-port="1" /> + <edge from-layer="6470" from-port="2" to-layer="6472" to-port="2" /> + <edge from-layer="6470" from-port="2" to-layer="6500" to-port="2" /> + <edge from-layer="6471" from-port="0" to-layer="6472" to-port="3" /> + <edge from-layer="6472" from-port="4" to-layer="6474" to-port="0" /> + <edge from-layer="6473" from-port="0" to-layer="6474" to-port="2" /> + <edge from-layer="6474" from-port="3" to-layer="6475" to-port="0" /> + <edge from-layer="6475" from-port="2" to-layer="6512" to-port="1" /> + <edge from-layer="6475" from-port="2" to-layer="6476" to-port="1" /> + <edge from-layer="6476" from-port="2" to-layer="6505" to-port="0" /> + <edge from-layer="6477" from-port="0" to-layer="6487" to-port="0" /> + <edge from-layer="6478" from-port="0" to-layer="6487" to-port="1" /> + <edge from-layer="6479" from-port="1" to-layer="6481" to-port="0" /> + <edge from-layer="6480" from-port="0" to-layer="6481" to-port="2" /> + <edge from-layer="6481" from-port="3" to-layer="6482" to-port="0" /> + <edge from-layer="6482" from-port="2" to-layer="6483" to-port="0" /> + <edge from-layer="6483" from-port="1" to-layer="6485" to-port="0" /> + <edge from-layer="6484" from-port="0" to-layer="6485" to-port="1" /> + <edge from-layer="6485" from-port="2" to-layer="6487" to-port="2" /> + <edge from-layer="6486" from-port="0" to-layer="6487" to-port="3" /> + <edge from-layer="6487" from-port="4" to-layer="6495" to-port="2" /> + <edge from-layer="6487" from-port="4" to-layer="6490" to-port="1" /> + <edge from-layer="6488" from-port="0" to-layer="6490" to-port="2" /> + <edge from-layer="6489" from-port="0" to-layer="6490" to-port="3" /> + <edge from-layer="6490" from-port="4" to-layer="6492" to-port="0" /> + <edge from-layer="6491" from-port="0" to-layer="6492" to-port="1" /> + <edge from-layer="6492" from-port="2" to-layer="6496" to-port="0" /> + <edge from-layer="6493" from-port="0" to-layer="6495" to-port="1" /> + <edge from-layer="6494" from-port="0" to-layer="6495" to-port="3" /> + <edge from-layer="6495" from-port="4" to-layer="6496" to-port="1" /> + <edge from-layer="6496" from-port="2" to-layer="6504" to-port="0" /> + <edge from-layer="6497" from-port="0" to-layer="6500" to-port="0" /> + <edge from-layer="6498" from-port="0" to-layer="6500" to-port="1" /> + <edge from-layer="6499" from-port="0" to-layer="6500" to-port="3" /> + <edge from-layer="6500" from-port="4" to-layer="6502" to-port="0" /> + <edge from-layer="6501" from-port="0" to-layer="6502" to-port="2" /> + <edge from-layer="6502" from-port="3" to-layer="6503" to-port="0" /> + <edge from-layer="6503" from-port="2" to-layer="6504" to-port="1" /> + <edge from-layer="6503" from-port="2" to-layer="6533" to-port="1" /> + <edge from-layer="6504" from-port="2" to-layer="6505" to-port="1" /> + <edge from-layer="6505" from-port="2" to-layer="6560" to-port="0" /> + <edge from-layer="6505" from-port="2" to-layer="6596" to-port="0" /> + <edge from-layer="6506" from-port="0" to-layer="6507" to-port="1" /> + <edge from-layer="6507" from-port="2" to-layer="6511" to-port="0" /> + <edge from-layer="6508" from-port="0" to-layer="6511" to-port="1" /> + <edge from-layer="6509" from-port="0" to-layer="6511" to-port="2" /> + <edge from-layer="6510" from-port="0" to-layer="6511" to-port="3" /> + <edge from-layer="6511" from-port="4" to-layer="6526" to-port="0" /> + <edge from-layer="6511" from-port="4" to-layer="6531" to-port="0" /> + <edge from-layer="6511" from-port="4" to-layer="6515" to-port="0" /> + <edge from-layer="6511" from-port="4" to-layer="6512" to-port="0" /> + <edge from-layer="6512" from-port="2" to-layer="6534" to-port="0" /> + <edge from-layer="6513" from-port="0" to-layer="6523" to-port="0" /> + <edge from-layer="6514" from-port="0" to-layer="6523" to-port="1" /> + <edge from-layer="6515" from-port="1" to-layer="6517" to-port="0" /> + <edge from-layer="6516" from-port="0" to-layer="6517" to-port="2" /> + <edge from-layer="6517" from-port="3" to-layer="6518" to-port="0" /> + <edge from-layer="6518" from-port="2" to-layer="6519" to-port="0" /> + <edge from-layer="6519" from-port="1" to-layer="6521" to-port="0" /> + <edge from-layer="6520" from-port="0" to-layer="6521" to-port="1" /> + <edge from-layer="6521" from-port="2" to-layer="6523" to-port="2" /> + <edge from-layer="6522" from-port="0" to-layer="6523" to-port="3" /> + <edge from-layer="6523" from-port="4" to-layer="6526" to-port="1" /> + <edge from-layer="6523" from-port="4" to-layer="6531" to-port="2" /> + <edge from-layer="6524" from-port="0" to-layer="6526" to-port="2" /> + <edge from-layer="6525" from-port="0" to-layer="6526" to-port="3" /> + <edge from-layer="6526" from-port="4" to-layer="6528" to-port="0" /> + <edge from-layer="6527" from-port="0" to-layer="6528" to-port="1" /> + <edge from-layer="6528" from-port="2" to-layer="6532" to-port="0" /> + <edge from-layer="6529" from-port="0" to-layer="6531" to-port="1" /> + <edge from-layer="6530" from-port="0" to-layer="6531" to-port="3" /> + <edge from-layer="6531" from-port="4" to-layer="6532" to-port="1" /> + <edge from-layer="6532" from-port="2" to-layer="6533" to-port="0" /> + <edge from-layer="6533" from-port="2" to-layer="6534" to-port="1" /> + <edge from-layer="6534" from-port="2" to-layer="6555" to-port="0" /> + <edge from-layer="6534" from-port="2" to-layer="6535" to-port="1" /> + <edge from-layer="6535" from-port="2" to-layer="7198" to-port="0" /> + <edge from-layer="6535" from-port="2" to-layer="6596" to-port="1" /> + <edge from-layer="6536" from-port="0" to-layer="6541" to-port="0" /> + <edge from-layer="6537" from-port="0" to-layer="6540" to-port="1" /> + <edge from-layer="6538" from-port="0" to-layer="6540" to-port="2" /> + <edge from-layer="6539" from-port="0" to-layer="6540" to-port="3" /> + <edge from-layer="6540" from-port="4" to-layer="6541" to-port="1" /> + <edge from-layer="6541" from-port="2" to-layer="6542" to-port="0" /> + <edge from-layer="6542" from-port="1" to-layer="6544" to-port="0" /> + <edge from-layer="6543" from-port="0" to-layer="6544" to-port="2" /> + <edge from-layer="6544" from-port="3" to-layer="6551" to-port="0" /> + <edge from-layer="6545" from-port="0" to-layer="6548" to-port="1" /> + <edge from-layer="6546" from-port="0" to-layer="6548" to-port="2" /> + <edge from-layer="6547" from-port="0" to-layer="6548" to-port="3" /> + <edge from-layer="6548" from-port="4" to-layer="6550" to-port="0" /> + <edge from-layer="6549" from-port="0" to-layer="6550" to-port="1" /> + <edge from-layer="6550" from-port="2" to-layer="6551" to-port="1" /> + <edge from-layer="6551" from-port="2" to-layer="7197" to-port="0" /> + <edge from-layer="6551" from-port="2" to-layer="6596" to-port="2" /> + <edge from-layer="6552" from-port="0" to-layer="6574" to-port="0" /> + <edge from-layer="6553" from-port="0" to-layer="6568" to-port="0" /> + <edge from-layer="6554" from-port="0" to-layer="6568" to-port="1" /> + <edge from-layer="6554" from-port="0" to-layer="6572" to-port="1" /> + <edge from-layer="6555" from-port="1" to-layer="6558" to-port="0" /> + <edge from-layer="6556" from-port="0" to-layer="6558" to-port="1" /> + <edge from-layer="6557" from-port="0" to-layer="6558" to-port="2" /> + <edge from-layer="6558" from-port="3" to-layer="6559" to-port="1" /> + <edge from-layer="6559" from-port="2" to-layer="6564" to-port="0" /> + <edge from-layer="6559" from-port="2" to-layer="6571" to-port="0" /> + <edge from-layer="6560" from-port="1" to-layer="6563" to-port="0" /> + <edge from-layer="6560" from-port="1" to-layer="6589" to-port="0" /> + <edge from-layer="6561" from-port="0" to-layer="6563" to-port="1" /> + <edge from-layer="6562" from-port="0" to-layer="6563" to-port="2" /> + <edge from-layer="6563" from-port="3" to-layer="6564" to-port="1" /> + <edge from-layer="6564" from-port="2" to-layer="6566" to-port="0" /> + <edge from-layer="6565" from-port="0" to-layer="6566" to-port="1" /> + <edge from-layer="6566" from-port="2" to-layer="6568" to-port="2" /> + <edge from-layer="6567" from-port="0" to-layer="6568" to-port="3" /> + <edge from-layer="6567" from-port="0" to-layer="6572" to-port="3" /> + <edge from-layer="6568" from-port="4" to-layer="6574" to-port="1" /> + <edge from-layer="6569" from-port="0" to-layer="6572" to-port="0" /> + <edge from-layer="6570" from-port="0" to-layer="6571" to-port="1" /> + <edge from-layer="6571" from-port="2" to-layer="6572" to-port="2" /> + <edge from-layer="6571" from-port="2" to-layer="6579" to-port="2" /> + <edge from-layer="6572" from-port="4" to-layer="6574" to-port="2" /> + <edge from-layer="6573" from-port="0" to-layer="6574" to-port="3" /> + <edge from-layer="6574" from-port="4" to-layer="6581" to-port="0" /> + <edge from-layer="6575" from-port="0" to-layer="6581" to-port="1" /> + <edge from-layer="6576" from-port="0" to-layer="6579" to-port="0" /> + <edge from-layer="6577" from-port="0" to-layer="6579" to-port="1" /> + <edge from-layer="6578" from-port="0" to-layer="6579" to-port="3" /> + <edge from-layer="6579" from-port="4" to-layer="6581" to-port="2" /> + <edge from-layer="6580" from-port="0" to-layer="6581" to-port="3" /> + <edge from-layer="6581" from-port="4" to-layer="6584" to-port="0" /> + <edge from-layer="6582" from-port="0" to-layer="6584" to-port="1" /> + <edge from-layer="6583" from-port="0" to-layer="6584" to-port="2" /> + <edge from-layer="6584" from-port="3" to-layer="6585" to-port="0" /> + <edge from-layer="6585" from-port="2" to-layer="6586" to-port="0" /> + <edge from-layer="6585" from-port="2" to-layer="6595" to-port="0" /> + <edge from-layer="6586" from-port="1" to-layer="6594" to-port="0" /> + <edge from-layer="6587" from-port="0" to-layer="6589" to-port="1" /> + <edge from-layer="6588" from-port="0" to-layer="6589" to-port="2" /> + <edge from-layer="6589" from-port="3" to-layer="6593" to-port="0" /> + <edge from-layer="6590" from-port="0" to-layer="6593" to-port="1" /> + <edge from-layer="6591" from-port="0" to-layer="6593" to-port="2" /> + <edge from-layer="6592" from-port="0" to-layer="6593" to-port="3" /> + <edge from-layer="6593" from-port="4" to-layer="6594" to-port="1" /> + <edge from-layer="6594" from-port="2" to-layer="6595" to-port="1" /> + <edge from-layer="6595" from-port="2" to-layer="6596" to-port="3" /> + <edge from-layer="6596" from-port="4" to-layer="6598" to-port="0" /> + <edge from-layer="6597" from-port="0" to-layer="6598" to-port="1" /> + <edge from-layer="6598" from-port="2" to-layer="6600" to-port="0" /> + <edge from-layer="6599" from-port="0" to-layer="6600" to-port="1" /> + <edge from-layer="6600" from-port="2" to-layer="6609" to-port="0" /> + <edge from-layer="6601" from-port="0" to-layer="6602" to-port="0" /> + <edge from-layer="6602" from-port="1" to-layer="6605" to-port="0" /> + <edge from-layer="6603" from-port="0" to-layer="6604" to-port="0" /> + <edge from-layer="6604" from-port="1" to-layer="6605" to-port="1" /> + <edge from-layer="6605" from-port="2" to-layer="6607" to-port="0" /> + <edge from-layer="6606" from-port="0" to-layer="6607" to-port="1" /> + <edge from-layer="6607" from-port="2" to-layer="6608" to-port="0" /> + <edge from-layer="6608" from-port="1" to-layer="6609" to-port="1" /> + <edge from-layer="6609" from-port="2" to-layer="6611" to-port="0" /> + <edge from-layer="6610" from-port="0" to-layer="6611" to-port="1" /> + <edge from-layer="6611" from-port="2" to-layer="6612" to-port="0" /> + <edge from-layer="6612" from-port="2" to-layer="6614" to-port="0" /> + <edge from-layer="6612" from-port="2" to-layer="6642" to-port="1" /> + <edge from-layer="6613" from-port="0" to-layer="6614" to-port="1" /> + <edge from-layer="6614" from-port="2" to-layer="6616" to-port="0" /> + <edge from-layer="6615" from-port="0" to-layer="6616" to-port="1" /> + <edge from-layer="6616" from-port="2" to-layer="6618" to-port="0" /> + <edge from-layer="6617" from-port="0" to-layer="6618" to-port="1" /> + <edge from-layer="6618" from-port="2" to-layer="6627" to-port="0" /> + <edge from-layer="6619" from-port="0" to-layer="6620" to-port="0" /> + <edge from-layer="6620" from-port="1" to-layer="6623" to-port="0" /> + <edge from-layer="6621" from-port="0" to-layer="6622" to-port="0" /> + <edge from-layer="6622" from-port="1" to-layer="6623" to-port="1" /> + <edge from-layer="6623" from-port="2" to-layer="6625" to-port="0" /> + <edge from-layer="6624" from-port="0" to-layer="6625" to-port="1" /> + <edge from-layer="6625" from-port="2" to-layer="6626" to-port="0" /> + <edge from-layer="6626" from-port="1" to-layer="6627" to-port="1" /> + <edge from-layer="6627" from-port="2" to-layer="6629" to-port="0" /> + <edge from-layer="6628" from-port="0" to-layer="6629" to-port="1" /> + <edge from-layer="6629" from-port="2" to-layer="6630" to-port="0" /> + <edge from-layer="6630" from-port="1" to-layer="6639" to-port="0" /> + <edge from-layer="6631" from-port="0" to-layer="6632" to-port="0" /> + <edge from-layer="6632" from-port="1" to-layer="6635" to-port="0" /> + <edge from-layer="6633" from-port="0" to-layer="6634" to-port="0" /> + <edge from-layer="6634" from-port="1" to-layer="6635" to-port="1" /> + <edge from-layer="6635" from-port="2" to-layer="6637" to-port="0" /> + <edge from-layer="6636" from-port="0" to-layer="6637" to-port="1" /> + <edge from-layer="6637" from-port="2" to-layer="6638" to-port="0" /> + <edge from-layer="6638" from-port="1" to-layer="6639" to-port="1" /> + <edge from-layer="6639" from-port="2" to-layer="6641" to-port="0" /> + <edge from-layer="6640" from-port="0" to-layer="6641" to-port="1" /> + <edge from-layer="6641" from-port="2" to-layer="6642" to-port="0" /> + <edge from-layer="6642" from-port="2" to-layer="6839" to-port="1" /> + <edge from-layer="6642" from-port="2" to-layer="6644" to-port="0" /> + <edge from-layer="6643" from-port="0" to-layer="6644" to-port="1" /> + <edge from-layer="6644" from-port="2" to-layer="6646" to-port="0" /> + <edge from-layer="6645" from-port="0" to-layer="6646" to-port="1" /> + <edge from-layer="6646" from-port="2" to-layer="6648" to-port="0" /> + <edge from-layer="6647" from-port="0" to-layer="6648" to-port="1" /> + <edge from-layer="6648" from-port="2" to-layer="6657" to-port="0" /> + <edge from-layer="6649" from-port="0" to-layer="6650" to-port="0" /> + <edge from-layer="6650" from-port="1" to-layer="6653" to-port="0" /> + <edge from-layer="6651" from-port="0" to-layer="6652" to-port="0" /> + <edge from-layer="6652" from-port="1" to-layer="6653" to-port="1" /> + <edge from-layer="6653" from-port="2" to-layer="6655" to-port="0" /> + <edge from-layer="6654" from-port="0" to-layer="6655" to-port="1" /> + <edge from-layer="6655" from-port="2" to-layer="6656" to-port="0" /> + <edge from-layer="6656" from-port="1" to-layer="6657" to-port="1" /> + <edge from-layer="6657" from-port="2" to-layer="6659" to-port="0" /> + <edge from-layer="6658" from-port="0" to-layer="6659" to-port="1" /> + <edge from-layer="6659" from-port="2" to-layer="6661" to-port="0" /> + <edge from-layer="6660" from-port="0" to-layer="6661" to-port="1" /> + <edge from-layer="6661" from-port="2" to-layer="6677" to-port="0" /> + <edge from-layer="6661" from-port="2" to-layer="6665" to-port="0" /> + <edge from-layer="6661" from-port="2" to-layer="6775" to-port="0" /> + <edge from-layer="6662" from-port="0" to-layer="6665" to-port="1" /> + <edge from-layer="6663" from-port="0" to-layer="6665" to-port="2" /> + <edge from-layer="6664" from-port="0" to-layer="6665" to-port="3" /> + <edge from-layer="6665" from-port="4" to-layer="6667" to-port="0" /> + <edge from-layer="6666" from-port="0" to-layer="6667" to-port="1" /> + <edge from-layer="6667" from-port="2" to-layer="6671" to-port="0" /> + <edge from-layer="6668" from-port="0" to-layer="6671" to-port="1" /> + <edge from-layer="6669" from-port="0" to-layer="6671" to-port="2" /> + <edge from-layer="6670" from-port="0" to-layer="6671" to-port="3" /> + <edge from-layer="6671" from-port="4" to-layer="6722" to-port="0" /> + <edge from-layer="6671" from-port="4" to-layer="6703" to-port="0" /> + <edge from-layer="6671" from-port="4" to-layer="6717" to-port="0" /> + <edge from-layer="6671" from-port="4" to-layer="6706" to-port="0" /> + <edge from-layer="6672" from-port="0" to-layer="6699" to-port="0" /> + <edge from-layer="6673" from-port="0" to-layer="6699" to-port="1" /> + <edge from-layer="6674" from-port="0" to-layer="6677" to-port="1" /> + <edge from-layer="6675" from-port="0" to-layer="6677" to-port="2" /> + <edge from-layer="6676" from-port="0" to-layer="6677" to-port="3" /> + <edge from-layer="6677" from-port="4" to-layer="6734" to-port="0" /> + <edge from-layer="6677" from-port="4" to-layer="6678" to-port="0" /> + <edge from-layer="6678" from-port="1" to-layer="6681" to-port="0" /> + <edge from-layer="6679" from-port="0" to-layer="6681" to-port="1" /> + <edge from-layer="6680" from-port="0" to-layer="6681" to-port="2" /> + <edge from-layer="6681" from-port="3" to-layer="6697" to-port="0" /> + <edge from-layer="6682" from-port="0" to-layer="6687" to-port="0" /> + <edge from-layer="6683" from-port="0" to-layer="6686" to-port="1" /> + <edge from-layer="6684" from-port="0" to-layer="6686" to-port="2" /> + <edge from-layer="6685" from-port="0" to-layer="6686" to-port="3" /> + <edge from-layer="6686" from-port="4" to-layer="6687" to-port="1" /> + <edge from-layer="6687" from-port="2" to-layer="6688" to-port="0" /> + <edge from-layer="6688" from-port="1" to-layer="6690" to-port="0" /> + <edge from-layer="6689" from-port="0" to-layer="6690" to-port="2" /> + <edge from-layer="6690" from-port="3" to-layer="6762" to-port="0" /> + <edge from-layer="6690" from-port="3" to-layer="6691" to-port="0" /> + <edge from-layer="6691" from-port="1" to-layer="6694" to-port="0" /> + <edge from-layer="6692" from-port="0" to-layer="6694" to-port="1" /> + <edge from-layer="6693" from-port="0" to-layer="6694" to-port="2" /> + <edge from-layer="6694" from-port="3" to-layer="6786" to-port="0" /> + <edge from-layer="6694" from-port="3" to-layer="6696" to-port="0" /> + <edge from-layer="6695" from-port="0" to-layer="6696" to-port="1" /> + <edge from-layer="6696" from-port="2" to-layer="6697" to-port="1" /> + <edge from-layer="6697" from-port="2" to-layer="6727" to-port="2" /> + <edge from-layer="6697" from-port="2" to-layer="6699" to-port="2" /> + <edge from-layer="6698" from-port="0" to-layer="6699" to-port="3" /> + <edge from-layer="6699" from-port="4" to-layer="6701" to-port="0" /> + <edge from-layer="6700" from-port="0" to-layer="6701" to-port="2" /> + <edge from-layer="6701" from-port="3" to-layer="6702" to-port="0" /> + <edge from-layer="6702" from-port="2" to-layer="6739" to-port="1" /> + <edge from-layer="6702" from-port="2" to-layer="6703" to-port="1" /> + <edge from-layer="6703" from-port="2" to-layer="6732" to-port="0" /> + <edge from-layer="6704" from-port="0" to-layer="6714" to-port="0" /> + <edge from-layer="6705" from-port="0" to-layer="6714" to-port="1" /> + <edge from-layer="6706" from-port="1" to-layer="6708" to-port="0" /> + <edge from-layer="6707" from-port="0" to-layer="6708" to-port="2" /> + <edge from-layer="6708" from-port="3" to-layer="6709" to-port="0" /> + <edge from-layer="6709" from-port="2" to-layer="6710" to-port="0" /> + <edge from-layer="6710" from-port="1" to-layer="6712" to-port="0" /> + <edge from-layer="6711" from-port="0" to-layer="6712" to-port="1" /> + <edge from-layer="6712" from-port="2" to-layer="6714" to-port="2" /> + <edge from-layer="6713" from-port="0" to-layer="6714" to-port="3" /> + <edge from-layer="6714" from-port="4" to-layer="6717" to-port="1" /> + <edge from-layer="6714" from-port="4" to-layer="6722" to-port="2" /> + <edge from-layer="6715" from-port="0" to-layer="6717" to-port="2" /> + <edge from-layer="6716" from-port="0" to-layer="6717" to-port="3" /> + <edge from-layer="6717" from-port="4" to-layer="6719" to-port="0" /> + <edge from-layer="6718" from-port="0" to-layer="6719" to-port="1" /> + <edge from-layer="6719" from-port="2" to-layer="6723" to-port="0" /> + <edge from-layer="6720" from-port="0" to-layer="6722" to-port="1" /> + <edge from-layer="6721" from-port="0" to-layer="6722" to-port="3" /> + <edge from-layer="6722" from-port="4" to-layer="6723" to-port="1" /> + <edge from-layer="6723" from-port="2" to-layer="6731" to-port="0" /> + <edge from-layer="6724" from-port="0" to-layer="6727" to-port="0" /> + <edge from-layer="6725" from-port="0" to-layer="6727" to-port="1" /> + <edge from-layer="6726" from-port="0" to-layer="6727" to-port="3" /> + <edge from-layer="6727" from-port="4" to-layer="6729" to-port="0" /> + <edge from-layer="6728" from-port="0" to-layer="6729" to-port="2" /> + <edge from-layer="6729" from-port="3" to-layer="6730" to-port="0" /> + <edge from-layer="6730" from-port="2" to-layer="6731" to-port="1" /> + <edge from-layer="6730" from-port="2" to-layer="6760" to-port="1" /> + <edge from-layer="6731" from-port="2" to-layer="6732" to-port="1" /> + <edge from-layer="6732" from-port="2" to-layer="6823" to-port="0" /> + <edge from-layer="6732" from-port="2" to-layer="6787" to-port="0" /> + <edge from-layer="6733" from-port="0" to-layer="6734" to-port="1" /> + <edge from-layer="6734" from-port="2" to-layer="6738" to-port="0" /> + <edge from-layer="6735" from-port="0" to-layer="6738" to-port="1" /> + <edge from-layer="6736" from-port="0" to-layer="6738" to-port="2" /> + <edge from-layer="6737" from-port="0" to-layer="6738" to-port="3" /> + <edge from-layer="6738" from-port="4" to-layer="6758" to-port="0" /> + <edge from-layer="6738" from-port="4" to-layer="6753" to-port="0" /> + <edge from-layer="6738" from-port="4" to-layer="6742" to-port="0" /> + <edge from-layer="6738" from-port="4" to-layer="6739" to-port="0" /> + <edge from-layer="6739" from-port="2" to-layer="6761" to-port="0" /> + <edge from-layer="6740" from-port="0" to-layer="6750" to-port="0" /> + <edge from-layer="6741" from-port="0" to-layer="6750" to-port="1" /> + <edge from-layer="6742" from-port="1" to-layer="6744" to-port="0" /> + <edge from-layer="6743" from-port="0" to-layer="6744" to-port="2" /> + <edge from-layer="6744" from-port="3" to-layer="6745" to-port="0" /> + <edge from-layer="6745" from-port="2" to-layer="6746" to-port="0" /> + <edge from-layer="6746" from-port="1" to-layer="6748" to-port="0" /> + <edge from-layer="6747" from-port="0" to-layer="6748" to-port="1" /> + <edge from-layer="6748" from-port="2" to-layer="6750" to-port="2" /> + <edge from-layer="6749" from-port="0" to-layer="6750" to-port="3" /> + <edge from-layer="6750" from-port="4" to-layer="6753" to-port="1" /> + <edge from-layer="6750" from-port="4" to-layer="6758" to-port="2" /> + <edge from-layer="6751" from-port="0" to-layer="6753" to-port="2" /> + <edge from-layer="6752" from-port="0" to-layer="6753" to-port="3" /> + <edge from-layer="6753" from-port="4" to-layer="6755" to-port="0" /> + <edge from-layer="6754" from-port="0" to-layer="6755" to-port="1" /> + <edge from-layer="6755" from-port="2" to-layer="6759" to-port="0" /> + <edge from-layer="6756" from-port="0" to-layer="6758" to-port="1" /> + <edge from-layer="6757" from-port="0" to-layer="6758" to-port="3" /> + <edge from-layer="6758" from-port="4" to-layer="6759" to-port="1" /> + <edge from-layer="6759" from-port="2" to-layer="6760" to-port="0" /> + <edge from-layer="6760" from-port="2" to-layer="6761" to-port="1" /> + <edge from-layer="6761" from-port="2" to-layer="6782" to-port="0" /> + <edge from-layer="6761" from-port="2" to-layer="6762" to-port="1" /> + <edge from-layer="6762" from-port="2" to-layer="6823" to-port="1" /> + <edge from-layer="6762" from-port="2" to-layer="7196" to-port="0" /> + <edge from-layer="6763" from-port="0" to-layer="6768" to-port="0" /> + <edge from-layer="6764" from-port="0" to-layer="6767" to-port="1" /> + <edge from-layer="6765" from-port="0" to-layer="6767" to-port="2" /> + <edge from-layer="6766" from-port="0" to-layer="6767" to-port="3" /> + <edge from-layer="6767" from-port="4" to-layer="6768" to-port="1" /> + <edge from-layer="6768" from-port="2" to-layer="6769" to-port="0" /> + <edge from-layer="6769" from-port="1" to-layer="6771" to-port="0" /> + <edge from-layer="6770" from-port="0" to-layer="6771" to-port="2" /> + <edge from-layer="6771" from-port="3" to-layer="6778" to-port="0" /> + <edge from-layer="6772" from-port="0" to-layer="6775" to-port="1" /> + <edge from-layer="6773" from-port="0" to-layer="6775" to-port="2" /> + <edge from-layer="6774" from-port="0" to-layer="6775" to-port="3" /> + <edge from-layer="6775" from-port="4" to-layer="6777" to-port="0" /> + <edge from-layer="6776" from-port="0" to-layer="6777" to-port="1" /> + <edge from-layer="6777" from-port="2" to-layer="6778" to-port="1" /> + <edge from-layer="6778" from-port="2" to-layer="6823" to-port="2" /> + <edge from-layer="6778" from-port="2" to-layer="7195" to-port="0" /> + <edge from-layer="6779" from-port="0" to-layer="6801" to-port="0" /> + <edge from-layer="6780" from-port="0" to-layer="6795" to-port="0" /> + <edge from-layer="6781" from-port="0" to-layer="6795" to-port="1" /> + <edge from-layer="6781" from-port="0" to-layer="6799" to-port="1" /> + <edge from-layer="6782" from-port="1" to-layer="6785" to-port="0" /> + <edge from-layer="6783" from-port="0" to-layer="6785" to-port="1" /> + <edge from-layer="6784" from-port="0" to-layer="6785" to-port="2" /> + <edge from-layer="6785" from-port="3" to-layer="6786" to-port="1" /> + <edge from-layer="6786" from-port="2" to-layer="6798" to-port="0" /> + <edge from-layer="6786" from-port="2" to-layer="6791" to-port="0" /> + <edge from-layer="6787" from-port="1" to-layer="6816" to-port="0" /> + <edge from-layer="6787" from-port="1" to-layer="6790" to-port="0" /> + <edge from-layer="6788" from-port="0" to-layer="6790" to-port="1" /> + <edge from-layer="6789" from-port="0" to-layer="6790" to-port="2" /> + <edge from-layer="6790" from-port="3" to-layer="6791" to-port="1" /> + <edge from-layer="6791" from-port="2" to-layer="6793" to-port="0" /> + <edge from-layer="6792" from-port="0" to-layer="6793" to-port="1" /> + <edge from-layer="6793" from-port="2" to-layer="6795" to-port="2" /> + <edge from-layer="6794" from-port="0" to-layer="6799" to-port="3" /> + <edge from-layer="6794" from-port="0" to-layer="6795" to-port="3" /> + <edge from-layer="6795" from-port="4" to-layer="6801" to-port="1" /> + <edge from-layer="6796" from-port="0" to-layer="6799" to-port="0" /> + <edge from-layer="6797" from-port="0" to-layer="6798" to-port="1" /> + <edge from-layer="6798" from-port="2" to-layer="6799" to-port="2" /> + <edge from-layer="6798" from-port="2" to-layer="6806" to-port="2" /> + <edge from-layer="6799" from-port="4" to-layer="6801" to-port="2" /> + <edge from-layer="6800" from-port="0" to-layer="6801" to-port="3" /> + <edge from-layer="6801" from-port="4" to-layer="6808" to-port="0" /> + <edge from-layer="6802" from-port="0" to-layer="6808" to-port="1" /> + <edge from-layer="6803" from-port="0" to-layer="6806" to-port="0" /> + <edge from-layer="6804" from-port="0" to-layer="6806" to-port="1" /> + <edge from-layer="6805" from-port="0" to-layer="6806" to-port="3" /> + <edge from-layer="6806" from-port="4" to-layer="6808" to-port="2" /> + <edge from-layer="6807" from-port="0" to-layer="6808" to-port="3" /> + <edge from-layer="6808" from-port="4" to-layer="6811" to-port="0" /> + <edge from-layer="6809" from-port="0" to-layer="6811" to-port="1" /> + <edge from-layer="6810" from-port="0" to-layer="6811" to-port="2" /> + <edge from-layer="6811" from-port="3" to-layer="6812" to-port="0" /> + <edge from-layer="6812" from-port="2" to-layer="6813" to-port="0" /> + <edge from-layer="6812" from-port="2" to-layer="6822" to-port="0" /> + <edge from-layer="6813" from-port="1" to-layer="6821" to-port="0" /> + <edge from-layer="6814" from-port="0" to-layer="6816" to-port="1" /> + <edge from-layer="6815" from-port="0" to-layer="6816" to-port="2" /> + <edge from-layer="6816" from-port="3" to-layer="6820" to-port="0" /> + <edge from-layer="6817" from-port="0" to-layer="6820" to-port="1" /> + <edge from-layer="6818" from-port="0" to-layer="6820" to-port="2" /> + <edge from-layer="6819" from-port="0" to-layer="6820" to-port="3" /> + <edge from-layer="6820" from-port="4" to-layer="6821" to-port="1" /> + <edge from-layer="6821" from-port="2" to-layer="6822" to-port="1" /> + <edge from-layer="6822" from-port="2" to-layer="6823" to-port="3" /> + <edge from-layer="6823" from-port="4" to-layer="6825" to-port="0" /> + <edge from-layer="6824" from-port="0" to-layer="6825" to-port="1" /> + <edge from-layer="6825" from-port="2" to-layer="6827" to-port="0" /> + <edge from-layer="6826" from-port="0" to-layer="6827" to-port="1" /> + <edge from-layer="6827" from-port="2" to-layer="6836" to-port="0" /> + <edge from-layer="6828" from-port="0" to-layer="6829" to-port="0" /> + <edge from-layer="6829" from-port="1" to-layer="6832" to-port="0" /> + <edge from-layer="6830" from-port="0" to-layer="6831" to-port="0" /> + <edge from-layer="6831" from-port="1" to-layer="6832" to-port="1" /> + <edge from-layer="6832" from-port="2" to-layer="6834" to-port="0" /> + <edge from-layer="6833" from-port="0" to-layer="6834" to-port="1" /> + <edge from-layer="6834" from-port="2" to-layer="6835" to-port="0" /> + <edge from-layer="6835" from-port="1" to-layer="6836" to-port="1" /> + <edge from-layer="6836" from-port="2" to-layer="6838" to-port="0" /> + <edge from-layer="6837" from-port="0" to-layer="6838" to-port="1" /> + <edge from-layer="6838" from-port="2" to-layer="6839" to-port="0" /> + <edge from-layer="6839" from-port="2" to-layer="6869" to-port="1" /> + <edge from-layer="6839" from-port="2" to-layer="6841" to-port="0" /> + <edge from-layer="6840" from-port="0" to-layer="6841" to-port="1" /> + <edge from-layer="6841" from-port="2" to-layer="6843" to-port="0" /> + <edge from-layer="6842" from-port="0" to-layer="6843" to-port="1" /> + <edge from-layer="6843" from-port="2" to-layer="6845" to-port="0" /> + <edge from-layer="6844" from-port="0" to-layer="6845" to-port="1" /> + <edge from-layer="6845" from-port="2" to-layer="6854" to-port="0" /> + <edge from-layer="6846" from-port="0" to-layer="6847" to-port="0" /> + <edge from-layer="6847" from-port="1" to-layer="6850" to-port="0" /> + <edge from-layer="6848" from-port="0" to-layer="6849" to-port="0" /> + <edge from-layer="6849" from-port="1" to-layer="6850" to-port="1" /> + <edge from-layer="6850" from-port="2" to-layer="6852" to-port="0" /> + <edge from-layer="6851" from-port="0" to-layer="6852" to-port="1" /> + <edge from-layer="6852" from-port="2" to-layer="6853" to-port="0" /> + <edge from-layer="6853" from-port="1" to-layer="6854" to-port="1" /> + <edge from-layer="6854" from-port="2" to-layer="6856" to-port="0" /> + <edge from-layer="6855" from-port="0" to-layer="6856" to-port="1" /> + <edge from-layer="6856" from-port="2" to-layer="6857" to-port="0" /> + <edge from-layer="6857" from-port="1" to-layer="6866" to-port="0" /> + <edge from-layer="6858" from-port="0" to-layer="6859" to-port="0" /> + <edge from-layer="6859" from-port="1" to-layer="6862" to-port="0" /> + <edge from-layer="6860" from-port="0" to-layer="6861" to-port="0" /> + <edge from-layer="6861" from-port="1" to-layer="6862" to-port="1" /> + <edge from-layer="6862" from-port="2" to-layer="6864" to-port="0" /> + <edge from-layer="6863" from-port="0" to-layer="6864" to-port="1" /> + <edge from-layer="6864" from-port="2" to-layer="6865" to-port="0" /> + <edge from-layer="6865" from-port="1" to-layer="6866" to-port="1" /> + <edge from-layer="6866" from-port="2" to-layer="6868" to-port="0" /> + <edge from-layer="6867" from-port="0" to-layer="6868" to-port="1" /> + <edge from-layer="6868" from-port="2" to-layer="6869" to-port="0" /> + <edge from-layer="6869" from-port="2" to-layer="7066" to-port="1" /> + <edge from-layer="6869" from-port="2" to-layer="6871" to-port="0" /> + <edge from-layer="6870" from-port="0" to-layer="6871" to-port="1" /> + <edge from-layer="6871" from-port="2" to-layer="6873" to-port="0" /> + <edge from-layer="6872" from-port="0" to-layer="6873" to-port="1" /> + <edge from-layer="6873" from-port="2" to-layer="6875" to-port="0" /> + <edge from-layer="6874" from-port="0" to-layer="6875" to-port="1" /> + <edge from-layer="6875" from-port="2" to-layer="6884" to-port="0" /> + <edge from-layer="6876" from-port="0" to-layer="6877" to-port="0" /> + <edge from-layer="6877" from-port="1" to-layer="6880" to-port="0" /> + <edge from-layer="6878" from-port="0" to-layer="6879" to-port="0" /> + <edge from-layer="6879" from-port="1" to-layer="6880" to-port="1" /> + <edge from-layer="6880" from-port="2" to-layer="6882" to-port="0" /> + <edge from-layer="6881" from-port="0" to-layer="6882" to-port="1" /> + <edge from-layer="6882" from-port="2" to-layer="6883" to-port="0" /> + <edge from-layer="6883" from-port="1" to-layer="6884" to-port="1" /> + <edge from-layer="6884" from-port="2" to-layer="6886" to-port="0" /> + <edge from-layer="6885" from-port="0" to-layer="6886" to-port="1" /> + <edge from-layer="6886" from-port="2" to-layer="6888" to-port="0" /> + <edge from-layer="6887" from-port="0" to-layer="6888" to-port="1" /> + <edge from-layer="6888" from-port="2" to-layer="7002" to-port="0" /> + <edge from-layer="6888" from-port="2" to-layer="6892" to-port="0" /> + <edge from-layer="6888" from-port="2" to-layer="6904" to-port="0" /> + <edge from-layer="6889" from-port="0" to-layer="6892" to-port="1" /> + <edge from-layer="6890" from-port="0" to-layer="6892" to-port="2" /> + <edge from-layer="6891" from-port="0" to-layer="6892" to-port="3" /> + <edge from-layer="6892" from-port="4" to-layer="6894" to-port="0" /> + <edge from-layer="6893" from-port="0" to-layer="6894" to-port="1" /> + <edge from-layer="6894" from-port="2" to-layer="6898" to-port="0" /> + <edge from-layer="6895" from-port="0" to-layer="6898" to-port="1" /> + <edge from-layer="6896" from-port="0" to-layer="6898" to-port="2" /> + <edge from-layer="6897" from-port="0" to-layer="6898" to-port="3" /> + <edge from-layer="6898" from-port="4" to-layer="6944" to-port="0" /> + <edge from-layer="6898" from-port="4" to-layer="6930" to-port="0" /> + <edge from-layer="6898" from-port="4" to-layer="6933" to-port="0" /> + <edge from-layer="6898" from-port="4" to-layer="6949" to-port="0" /> + <edge from-layer="6899" from-port="0" to-layer="6926" to-port="0" /> + <edge from-layer="6900" from-port="0" to-layer="6926" to-port="1" /> + <edge from-layer="6901" from-port="0" to-layer="6904" to-port="1" /> + <edge from-layer="6902" from-port="0" to-layer="6904" to-port="2" /> + <edge from-layer="6903" from-port="0" to-layer="6904" to-port="3" /> + <edge from-layer="6904" from-port="4" to-layer="6961" to-port="0" /> + <edge from-layer="6904" from-port="4" to-layer="6905" to-port="0" /> + <edge from-layer="6905" from-port="1" to-layer="6908" to-port="0" /> + <edge from-layer="6906" from-port="0" to-layer="6908" to-port="1" /> + <edge from-layer="6907" from-port="0" to-layer="6908" to-port="2" /> + <edge from-layer="6908" from-port="3" to-layer="6924" to-port="0" /> + <edge from-layer="6909" from-port="0" to-layer="6914" to-port="0" /> + <edge from-layer="6910" from-port="0" to-layer="6913" to-port="1" /> + <edge from-layer="6911" from-port="0" to-layer="6913" to-port="2" /> + <edge from-layer="6912" from-port="0" to-layer="6913" to-port="3" /> + <edge from-layer="6913" from-port="4" to-layer="6914" to-port="1" /> + <edge from-layer="6914" from-port="2" to-layer="6915" to-port="0" /> + <edge from-layer="6915" from-port="1" to-layer="6917" to-port="0" /> + <edge from-layer="6916" from-port="0" to-layer="6917" to-port="2" /> + <edge from-layer="6917" from-port="3" to-layer="6989" to-port="0" /> + <edge from-layer="6917" from-port="3" to-layer="6918" to-port="0" /> + <edge from-layer="6918" from-port="1" to-layer="6921" to-port="0" /> + <edge from-layer="6919" from-port="0" to-layer="6921" to-port="1" /> + <edge from-layer="6920" from-port="0" to-layer="6921" to-port="2" /> + <edge from-layer="6921" from-port="3" to-layer="7013" to-port="0" /> + <edge from-layer="6921" from-port="3" to-layer="6923" to-port="0" /> + <edge from-layer="6922" from-port="0" to-layer="6923" to-port="1" /> + <edge from-layer="6923" from-port="2" to-layer="6924" to-port="1" /> + <edge from-layer="6924" from-port="2" to-layer="6954" to-port="2" /> + <edge from-layer="6924" from-port="2" to-layer="6926" to-port="2" /> + <edge from-layer="6925" from-port="0" to-layer="6926" to-port="3" /> + <edge from-layer="6926" from-port="4" to-layer="6928" to-port="0" /> + <edge from-layer="6927" from-port="0" to-layer="6928" to-port="2" /> + <edge from-layer="6928" from-port="3" to-layer="6929" to-port="0" /> + <edge from-layer="6929" from-port="2" to-layer="6966" to-port="1" /> + <edge from-layer="6929" from-port="2" to-layer="6930" to-port="1" /> + <edge from-layer="6930" from-port="2" to-layer="6959" to-port="0" /> + <edge from-layer="6931" from-port="0" to-layer="6941" to-port="0" /> + <edge from-layer="6932" from-port="0" to-layer="6941" to-port="1" /> + <edge from-layer="6933" from-port="1" to-layer="6935" to-port="0" /> + <edge from-layer="6934" from-port="0" to-layer="6935" to-port="2" /> + <edge from-layer="6935" from-port="3" to-layer="6936" to-port="0" /> + <edge from-layer="6936" from-port="2" to-layer="6937" to-port="0" /> + <edge from-layer="6937" from-port="1" to-layer="6939" to-port="0" /> + <edge from-layer="6938" from-port="0" to-layer="6939" to-port="1" /> + <edge from-layer="6939" from-port="2" to-layer="6941" to-port="2" /> + <edge from-layer="6940" from-port="0" to-layer="6941" to-port="3" /> + <edge from-layer="6941" from-port="4" to-layer="6944" to-port="1" /> + <edge from-layer="6941" from-port="4" to-layer="6949" to-port="2" /> + <edge from-layer="6942" from-port="0" to-layer="6944" to-port="2" /> + <edge from-layer="6943" from-port="0" to-layer="6944" to-port="3" /> + <edge from-layer="6944" from-port="4" to-layer="6946" to-port="0" /> + <edge from-layer="6945" from-port="0" to-layer="6946" to-port="1" /> + <edge from-layer="6946" from-port="2" to-layer="6950" to-port="0" /> + <edge from-layer="6947" from-port="0" to-layer="6949" to-port="1" /> + <edge from-layer="6948" from-port="0" to-layer="6949" to-port="3" /> + <edge from-layer="6949" from-port="4" to-layer="6950" to-port="1" /> + <edge from-layer="6950" from-port="2" to-layer="6958" to-port="0" /> + <edge from-layer="6951" from-port="0" to-layer="6954" to-port="0" /> + <edge from-layer="6952" from-port="0" to-layer="6954" to-port="1" /> + <edge from-layer="6953" from-port="0" to-layer="6954" to-port="3" /> + <edge from-layer="6954" from-port="4" to-layer="6956" to-port="0" /> + <edge from-layer="6955" from-port="0" to-layer="6956" to-port="2" /> + <edge from-layer="6956" from-port="3" to-layer="6957" to-port="0" /> + <edge from-layer="6957" from-port="2" to-layer="6987" to-port="1" /> + <edge from-layer="6957" from-port="2" to-layer="6958" to-port="1" /> + <edge from-layer="6958" from-port="2" to-layer="6959" to-port="1" /> + <edge from-layer="6959" from-port="2" to-layer="7050" to-port="0" /> + <edge from-layer="6959" from-port="2" to-layer="7014" to-port="0" /> + <edge from-layer="6960" from-port="0" to-layer="6961" to-port="1" /> + <edge from-layer="6961" from-port="2" to-layer="6965" to-port="0" /> + <edge from-layer="6962" from-port="0" to-layer="6965" to-port="1" /> + <edge from-layer="6963" from-port="0" to-layer="6965" to-port="2" /> + <edge from-layer="6964" from-port="0" to-layer="6965" to-port="3" /> + <edge from-layer="6965" from-port="4" to-layer="6980" to-port="0" /> + <edge from-layer="6965" from-port="4" to-layer="6985" to-port="0" /> + <edge from-layer="6965" from-port="4" to-layer="6969" to-port="0" /> + <edge from-layer="6965" from-port="4" to-layer="6966" to-port="0" /> + <edge from-layer="6966" from-port="2" to-layer="6988" to-port="0" /> + <edge from-layer="6967" from-port="0" to-layer="6977" to-port="0" /> + <edge from-layer="6968" from-port="0" to-layer="6977" to-port="1" /> + <edge from-layer="6969" from-port="1" to-layer="6971" to-port="0" /> + <edge from-layer="6970" from-port="0" to-layer="6971" to-port="2" /> + <edge from-layer="6971" from-port="3" to-layer="6972" to-port="0" /> + <edge from-layer="6972" from-port="2" to-layer="6973" to-port="0" /> + <edge from-layer="6973" from-port="1" to-layer="6975" to-port="0" /> + <edge from-layer="6974" from-port="0" to-layer="6975" to-port="1" /> + <edge from-layer="6975" from-port="2" to-layer="6977" to-port="2" /> + <edge from-layer="6976" from-port="0" to-layer="6977" to-port="3" /> + <edge from-layer="6977" from-port="4" to-layer="6985" to-port="2" /> + <edge from-layer="6977" from-port="4" to-layer="6980" to-port="1" /> + <edge from-layer="6978" from-port="0" to-layer="6980" to-port="2" /> + <edge from-layer="6979" from-port="0" to-layer="6980" to-port="3" /> + <edge from-layer="6980" from-port="4" to-layer="6982" to-port="0" /> + <edge from-layer="6981" from-port="0" to-layer="6982" to-port="1" /> + <edge from-layer="6982" from-port="2" to-layer="6986" to-port="0" /> + <edge from-layer="6983" from-port="0" to-layer="6985" to-port="1" /> + <edge from-layer="6984" from-port="0" to-layer="6985" to-port="3" /> + <edge from-layer="6985" from-port="4" to-layer="6986" to-port="1" /> + <edge from-layer="6986" from-port="2" to-layer="6987" to-port="0" /> + <edge from-layer="6987" from-port="2" to-layer="6988" to-port="1" /> + <edge from-layer="6988" from-port="2" to-layer="7009" to-port="0" /> + <edge from-layer="6988" from-port="2" to-layer="6989" to-port="1" /> + <edge from-layer="6989" from-port="2" to-layer="7192" to-port="0" /> + <edge from-layer="6989" from-port="2" to-layer="7050" to-port="1" /> + <edge from-layer="6990" from-port="0" to-layer="6995" to-port="0" /> + <edge from-layer="6991" from-port="0" to-layer="6994" to-port="1" /> + <edge from-layer="6992" from-port="0" to-layer="6994" to-port="2" /> + <edge from-layer="6993" from-port="0" to-layer="6994" to-port="3" /> + <edge from-layer="6994" from-port="4" to-layer="6995" to-port="1" /> + <edge from-layer="6995" from-port="2" to-layer="6996" to-port="0" /> + <edge from-layer="6996" from-port="1" to-layer="6998" to-port="0" /> + <edge from-layer="6997" from-port="0" to-layer="6998" to-port="2" /> + <edge from-layer="6998" from-port="3" to-layer="7005" to-port="0" /> + <edge from-layer="6999" from-port="0" to-layer="7002" to-port="1" /> + <edge from-layer="7000" from-port="0" to-layer="7002" to-port="2" /> + <edge from-layer="7001" from-port="0" to-layer="7002" to-port="3" /> + <edge from-layer="7002" from-port="4" to-layer="7004" to-port="0" /> + <edge from-layer="7003" from-port="0" to-layer="7004" to-port="1" /> + <edge from-layer="7004" from-port="2" to-layer="7005" to-port="1" /> + <edge from-layer="7005" from-port="2" to-layer="7050" to-port="2" /> + <edge from-layer="7005" from-port="2" to-layer="7191" to-port="0" /> + <edge from-layer="7006" from-port="0" to-layer="7028" to-port="0" /> + <edge from-layer="7007" from-port="0" to-layer="7022" to-port="0" /> + <edge from-layer="7008" from-port="0" to-layer="7026" to-port="1" /> + <edge from-layer="7008" from-port="0" to-layer="7022" to-port="1" /> + <edge from-layer="7009" from-port="1" to-layer="7012" to-port="0" /> + <edge from-layer="7010" from-port="0" to-layer="7012" to-port="1" /> + <edge from-layer="7011" from-port="0" to-layer="7012" to-port="2" /> + <edge from-layer="7012" from-port="3" to-layer="7013" to-port="1" /> + <edge from-layer="7013" from-port="2" to-layer="7018" to-port="0" /> + <edge from-layer="7013" from-port="2" to-layer="7025" to-port="0" /> + <edge from-layer="7014" from-port="1" to-layer="7043" to-port="0" /> + <edge from-layer="7014" from-port="1" to-layer="7017" to-port="0" /> + <edge from-layer="7015" from-port="0" to-layer="7017" to-port="1" /> + <edge from-layer="7016" from-port="0" to-layer="7017" to-port="2" /> + <edge from-layer="7017" from-port="3" to-layer="7018" to-port="1" /> + <edge from-layer="7018" from-port="2" to-layer="7020" to-port="0" /> + <edge from-layer="7019" from-port="0" to-layer="7020" to-port="1" /> + <edge from-layer="7020" from-port="2" to-layer="7022" to-port="2" /> + <edge from-layer="7021" from-port="0" to-layer="7026" to-port="3" /> + <edge from-layer="7021" from-port="0" to-layer="7022" to-port="3" /> + <edge from-layer="7022" from-port="4" to-layer="7028" to-port="1" /> + <edge from-layer="7023" from-port="0" to-layer="7026" to-port="0" /> + <edge from-layer="7024" from-port="0" to-layer="7025" to-port="1" /> + <edge from-layer="7025" from-port="2" to-layer="7033" to-port="2" /> + <edge from-layer="7025" from-port="2" to-layer="7026" to-port="2" /> + <edge from-layer="7026" from-port="4" to-layer="7028" to-port="2" /> + <edge from-layer="7027" from-port="0" to-layer="7028" to-port="3" /> + <edge from-layer="7028" from-port="4" to-layer="7035" to-port="0" /> + <edge from-layer="7029" from-port="0" to-layer="7035" to-port="1" /> + <edge from-layer="7030" from-port="0" to-layer="7033" to-port="0" /> + <edge from-layer="7031" from-port="0" to-layer="7033" to-port="1" /> + <edge from-layer="7032" from-port="0" to-layer="7033" to-port="3" /> + <edge from-layer="7033" from-port="4" to-layer="7035" to-port="2" /> + <edge from-layer="7034" from-port="0" to-layer="7035" to-port="3" /> + <edge from-layer="7035" from-port="4" to-layer="7038" to-port="0" /> + <edge from-layer="7036" from-port="0" to-layer="7038" to-port="1" /> + <edge from-layer="7037" from-port="0" to-layer="7038" to-port="2" /> + <edge from-layer="7038" from-port="3" to-layer="7039" to-port="0" /> + <edge from-layer="7039" from-port="2" to-layer="7049" to-port="0" /> + <edge from-layer="7039" from-port="2" to-layer="7040" to-port="0" /> + <edge from-layer="7040" from-port="1" to-layer="7048" to-port="0" /> + <edge from-layer="7041" from-port="0" to-layer="7043" to-port="1" /> + <edge from-layer="7042" from-port="0" to-layer="7043" to-port="2" /> + <edge from-layer="7043" from-port="3" to-layer="7047" to-port="0" /> + <edge from-layer="7044" from-port="0" to-layer="7047" to-port="1" /> + <edge from-layer="7045" from-port="0" to-layer="7047" to-port="2" /> + <edge from-layer="7046" from-port="0" to-layer="7047" to-port="3" /> + <edge from-layer="7047" from-port="4" to-layer="7048" to-port="1" /> + <edge from-layer="7048" from-port="2" to-layer="7049" to-port="1" /> + <edge from-layer="7049" from-port="2" to-layer="7050" to-port="3" /> + <edge from-layer="7050" from-port="4" to-layer="7052" to-port="0" /> + <edge from-layer="7051" from-port="0" to-layer="7052" to-port="1" /> + <edge from-layer="7052" from-port="2" to-layer="7054" to-port="0" /> + <edge from-layer="7053" from-port="0" to-layer="7054" to-port="1" /> + <edge from-layer="7054" from-port="2" to-layer="7063" to-port="0" /> + <edge from-layer="7055" from-port="0" to-layer="7056" to-port="0" /> + <edge from-layer="7056" from-port="1" to-layer="7059" to-port="0" /> + <edge from-layer="7057" from-port="0" to-layer="7058" to-port="0" /> + <edge from-layer="7058" from-port="1" to-layer="7059" to-port="1" /> + <edge from-layer="7059" from-port="2" to-layer="7061" to-port="0" /> + <edge from-layer="7060" from-port="0" to-layer="7061" to-port="1" /> + <edge from-layer="7061" from-port="2" to-layer="7062" to-port="0" /> + <edge from-layer="7062" from-port="1" to-layer="7063" to-port="1" /> + <edge from-layer="7063" from-port="2" to-layer="7065" to-port="0" /> + <edge from-layer="7064" from-port="0" to-layer="7065" to-port="1" /> + <edge from-layer="7065" from-port="2" to-layer="7066" to-port="0" /> + <edge from-layer="7066" from-port="2" to-layer="7068" to-port="0" /> + <edge from-layer="7066" from-port="2" to-layer="7096" to-port="1" /> + <edge from-layer="7067" from-port="0" to-layer="7068" to-port="1" /> + <edge from-layer="7068" from-port="2" to-layer="7070" to-port="0" /> + <edge from-layer="7069" from-port="0" to-layer="7070" to-port="1" /> + <edge from-layer="7070" from-port="2" to-layer="7072" to-port="0" /> + <edge from-layer="7071" from-port="0" to-layer="7072" to-port="1" /> + <edge from-layer="7072" from-port="2" to-layer="7081" to-port="0" /> + <edge from-layer="7073" from-port="0" to-layer="7074" to-port="0" /> + <edge from-layer="7074" from-port="1" to-layer="7077" to-port="0" /> + <edge from-layer="7075" from-port="0" to-layer="7076" to-port="0" /> + <edge from-layer="7076" from-port="1" to-layer="7077" to-port="1" /> + <edge from-layer="7077" from-port="2" to-layer="7079" to-port="0" /> + <edge from-layer="7078" from-port="0" to-layer="7079" to-port="1" /> + <edge from-layer="7079" from-port="2" to-layer="7080" to-port="0" /> + <edge from-layer="7080" from-port="1" to-layer="7081" to-port="1" /> + <edge from-layer="7081" from-port="2" to-layer="7083" to-port="0" /> + <edge from-layer="7082" from-port="0" to-layer="7083" to-port="1" /> + <edge from-layer="7083" from-port="2" to-layer="7084" to-port="0" /> + <edge from-layer="7084" from-port="1" to-layer="7093" to-port="0" /> + <edge from-layer="7085" from-port="0" to-layer="7086" to-port="0" /> + <edge from-layer="7086" from-port="1" to-layer="7089" to-port="0" /> + <edge from-layer="7087" from-port="0" to-layer="7088" to-port="0" /> + <edge from-layer="7088" from-port="1" to-layer="7089" to-port="1" /> + <edge from-layer="7089" from-port="2" to-layer="7091" to-port="0" /> + <edge from-layer="7090" from-port="0" to-layer="7091" to-port="1" /> + <edge from-layer="7091" from-port="2" to-layer="7092" to-port="0" /> + <edge from-layer="7092" from-port="1" to-layer="7093" to-port="1" /> + <edge from-layer="7093" from-port="2" to-layer="7095" to-port="0" /> + <edge from-layer="7094" from-port="0" to-layer="7095" to-port="1" /> + <edge from-layer="7095" from-port="2" to-layer="7096" to-port="0" /> + <edge from-layer="7096" from-port="2" to-layer="7098" to-port="0" /> + <edge from-layer="7096" from-port="2" to-layer="7338" to-port="1" /> + <edge from-layer="7097" from-port="0" to-layer="7098" to-port="1" /> + <edge from-layer="7098" from-port="2" to-layer="7100" to-port="0" /> + <edge from-layer="7099" from-port="0" to-layer="7100" to-port="1" /> + <edge from-layer="7100" from-port="2" to-layer="7102" to-port="0" /> + <edge from-layer="7101" from-port="0" to-layer="7102" to-port="1" /> + <edge from-layer="7102" from-port="2" to-layer="7111" to-port="0" /> + <edge from-layer="7103" from-port="0" to-layer="7104" to-port="0" /> + <edge from-layer="7104" from-port="1" to-layer="7107" to-port="0" /> + <edge from-layer="7105" from-port="0" to-layer="7106" to-port="0" /> + <edge from-layer="7106" from-port="1" to-layer="7107" to-port="1" /> + <edge from-layer="7107" from-port="2" to-layer="7109" to-port="0" /> + <edge from-layer="7108" from-port="0" to-layer="7109" to-port="1" /> + <edge from-layer="7109" from-port="2" to-layer="7110" to-port="0" /> + <edge from-layer="7110" from-port="1" to-layer="7111" to-port="1" /> + <edge from-layer="7111" from-port="2" to-layer="7113" to-port="0" /> + <edge from-layer="7112" from-port="0" to-layer="7113" to-port="1" /> + <edge from-layer="7113" from-port="2" to-layer="7115" to-port="0" /> + <edge from-layer="7114" from-port="0" to-layer="7115" to-port="1" /> + <edge from-layer="7115" from-port="2" to-layer="7119" to-port="0" /> + <edge from-layer="7115" from-port="2" to-layer="7136" to-port="0" /> + <edge from-layer="7115" from-port="2" to-layer="7244" to-port="0" /> + <edge from-layer="7116" from-port="0" to-layer="7119" to-port="1" /> + <edge from-layer="7117" from-port="0" to-layer="7119" to-port="2" /> + <edge from-layer="7118" from-port="0" to-layer="7119" to-port="3" /> + <edge from-layer="7119" from-port="4" to-layer="7281" to-port="0" /> + <edge from-layer="7119" from-port="4" to-layer="7121" to-port="0" /> + <edge from-layer="7120" from-port="0" to-layer="7121" to-port="1" /> + <edge from-layer="7121" from-port="2" to-layer="7122" to-port="1" /> + <edge from-layer="7122" from-port="2" to-layer="7123" to-port="0" /> + <edge from-layer="7122" from-port="2" to-layer="7322" to-port="2" /> + <edge from-layer="7124" from-port="0" to-layer="7129" to-port="0" /> + <edge from-layer="7125" from-port="0" to-layer="7128" to-port="1" /> + <edge from-layer="7126" from-port="0" to-layer="7128" to-port="2" /> + <edge from-layer="7127" from-port="0" to-layer="7128" to-port="3" /> + <edge from-layer="7128" from-port="4" to-layer="7129" to-port="1" /> + <edge from-layer="7129" from-port="2" to-layer="7130" to-port="0" /> + <edge from-layer="7130" from-port="1" to-layer="7132" to-port="0" /> + <edge from-layer="7131" from-port="0" to-layer="7132" to-port="2" /> + <edge from-layer="7132" from-port="3" to-layer="7189" to-port="0" /> + <edge from-layer="7132" from-port="3" to-layer="7149" to-port="0" /> + <edge from-layer="7133" from-port="0" to-layer="7136" to-port="1" /> + <edge from-layer="7134" from-port="0" to-layer="7136" to-port="2" /> + <edge from-layer="7135" from-port="0" to-layer="7136" to-port="3" /> + <edge from-layer="7136" from-port="4" to-layer="7145" to-port="0" /> + <edge from-layer="7136" from-port="4" to-layer="7138" to-port="0" /> + <edge from-layer="7137" from-port="0" to-layer="7138" to-port="1" /> + <edge from-layer="7138" from-port="2" to-layer="7142" to-port="0" /> + <edge from-layer="7139" from-port="0" to-layer="7142" to-port="1" /> + <edge from-layer="7140" from-port="0" to-layer="7142" to-port="2" /> + <edge from-layer="7141" from-port="0" to-layer="7142" to-port="3" /> + <edge from-layer="7142" from-port="4" to-layer="7178" to-port="0" /> + <edge from-layer="7142" from-port="4" to-layer="7173" to-port="0" /> + <edge from-layer="7142" from-port="4" to-layer="7159" to-port="0" /> + <edge from-layer="7142" from-port="4" to-layer="7162" to-port="0" /> + <edge from-layer="7143" from-port="0" to-layer="7155" to-port="0" /> + <edge from-layer="7144" from-port="0" to-layer="7155" to-port="1" /> + <edge from-layer="7145" from-port="1" to-layer="7148" to-port="0" /> + <edge from-layer="7146" from-port="0" to-layer="7148" to-port="1" /> + <edge from-layer="7147" from-port="0" to-layer="7148" to-port="2" /> + <edge from-layer="7148" from-port="3" to-layer="7153" to-port="0" /> + <edge from-layer="7149" from-port="1" to-layer="7152" to-port="0" /> + <edge from-layer="7150" from-port="0" to-layer="7152" to-port="1" /> + <edge from-layer="7151" from-port="0" to-layer="7152" to-port="2" /> + <edge from-layer="7152" from-port="3" to-layer="7153" to-port="1" /> + <edge from-layer="7153" from-port="2" to-layer="7155" to-port="2" /> + <edge from-layer="7153" from-port="2" to-layer="7183" to-port="2" /> + <edge from-layer="7154" from-port="0" to-layer="7155" to-port="3" /> + <edge from-layer="7155" from-port="4" to-layer="7157" to-port="0" /> + <edge from-layer="7156" from-port="0" to-layer="7157" to-port="2" /> + <edge from-layer="7157" from-port="3" to-layer="7158" to-port="0" /> + <edge from-layer="7158" from-port="2" to-layer="7159" to-port="1" /> + <edge from-layer="7158" from-port="2" to-layer="7251" to-port="1" /> + <edge from-layer="7159" from-port="2" to-layer="7188" to-port="0" /> + <edge from-layer="7160" from-port="0" to-layer="7170" to-port="0" /> + <edge from-layer="7161" from-port="0" to-layer="7170" to-port="1" /> + <edge from-layer="7162" from-port="1" to-layer="7164" to-port="0" /> + <edge from-layer="7163" from-port="0" to-layer="7164" to-port="2" /> + <edge from-layer="7164" from-port="3" to-layer="7165" to-port="0" /> + <edge from-layer="7165" from-port="2" to-layer="7166" to-port="0" /> + <edge from-layer="7166" from-port="1" to-layer="7168" to-port="0" /> + <edge from-layer="7167" from-port="0" to-layer="7168" to-port="1" /> + <edge from-layer="7168" from-port="2" to-layer="7170" to-port="2" /> + <edge from-layer="7169" from-port="0" to-layer="7170" to-port="3" /> + <edge from-layer="7170" from-port="4" to-layer="7173" to-port="1" /> + <edge from-layer="7170" from-port="4" to-layer="7178" to-port="2" /> + <edge from-layer="7171" from-port="0" to-layer="7173" to-port="2" /> + <edge from-layer="7172" from-port="0" to-layer="7173" to-port="3" /> + <edge from-layer="7173" from-port="4" to-layer="7175" to-port="0" /> + <edge from-layer="7174" from-port="0" to-layer="7175" to-port="1" /> + <edge from-layer="7175" from-port="2" to-layer="7179" to-port="0" /> + <edge from-layer="7176" from-port="0" to-layer="7178" to-port="1" /> + <edge from-layer="7177" from-port="0" to-layer="7178" to-port="3" /> + <edge from-layer="7178" from-port="4" to-layer="7179" to-port="1" /> + <edge from-layer="7179" from-port="2" to-layer="7187" to-port="0" /> + <edge from-layer="7180" from-port="0" to-layer="7183" to-port="0" /> + <edge from-layer="7181" from-port="0" to-layer="7183" to-port="1" /> + <edge from-layer="7182" from-port="0" to-layer="7183" to-port="3" /> + <edge from-layer="7183" from-port="4" to-layer="7185" to-port="0" /> + <edge from-layer="7184" from-port="0" to-layer="7185" to-port="2" /> + <edge from-layer="7185" from-port="3" to-layer="7186" to-port="0" /> + <edge from-layer="7186" from-port="2" to-layer="7187" to-port="1" /> + <edge from-layer="7186" from-port="2" to-layer="7272" to-port="1" /> + <edge from-layer="7187" from-port="2" to-layer="7188" to-port="1" /> + <edge from-layer="7188" from-port="2" to-layer="7189" to-port="1" /> + <edge from-layer="7189" from-port="2" to-layer="7322" to-port="1" /> + <edge from-layer="7189" from-port="2" to-layer="7190" to-port="0" /> + <edge from-layer="7241" from-port="0" to-layer="7244" to-port="1" /> + <edge from-layer="7242" from-port="0" to-layer="7244" to-port="2" /> + <edge from-layer="7243" from-port="0" to-layer="7244" to-port="3" /> + <edge from-layer="7244" from-port="4" to-layer="7246" to-port="0" /> + <edge from-layer="7245" from-port="0" to-layer="7246" to-port="1" /> + <edge from-layer="7246" from-port="2" to-layer="7250" to-port="0" /> + <edge from-layer="7247" from-port="0" to-layer="7250" to-port="1" /> + <edge from-layer="7248" from-port="0" to-layer="7250" to-port="2" /> + <edge from-layer="7249" from-port="0" to-layer="7250" to-port="3" /> + <edge from-layer="7250" from-port="4" to-layer="7270" to-port="0" /> + <edge from-layer="7250" from-port="4" to-layer="7265" to-port="0" /> + <edge from-layer="7250" from-port="4" to-layer="7254" to-port="0" /> + <edge from-layer="7250" from-port="4" to-layer="7251" to-port="0" /> + <edge from-layer="7251" from-port="2" to-layer="7273" to-port="0" /> + <edge from-layer="7252" from-port="0" to-layer="7262" to-port="0" /> + <edge from-layer="7253" from-port="0" to-layer="7262" to-port="1" /> + <edge from-layer="7254" from-port="1" to-layer="7256" to-port="0" /> + <edge from-layer="7255" from-port="0" to-layer="7256" to-port="2" /> + <edge from-layer="7256" from-port="3" to-layer="7257" to-port="0" /> + <edge from-layer="7257" from-port="2" to-layer="7258" to-port="0" /> + <edge from-layer="7258" from-port="1" to-layer="7260" to-port="0" /> + <edge from-layer="7259" from-port="0" to-layer="7260" to-port="1" /> + <edge from-layer="7260" from-port="2" to-layer="7262" to-port="2" /> + <edge from-layer="7261" from-port="0" to-layer="7262" to-port="3" /> + <edge from-layer="7262" from-port="4" to-layer="7265" to-port="1" /> + <edge from-layer="7262" from-port="4" to-layer="7270" to-port="2" /> + <edge from-layer="7263" from-port="0" to-layer="7265" to-port="2" /> + <edge from-layer="7264" from-port="0" to-layer="7265" to-port="3" /> + <edge from-layer="7265" from-port="4" to-layer="7267" to-port="0" /> + <edge from-layer="7266" from-port="0" to-layer="7267" to-port="1" /> + <edge from-layer="7267" from-port="2" to-layer="7271" to-port="0" /> + <edge from-layer="7268" from-port="0" to-layer="7270" to-port="1" /> + <edge from-layer="7269" from-port="0" to-layer="7270" to-port="3" /> + <edge from-layer="7270" from-port="4" to-layer="7271" to-port="1" /> + <edge from-layer="7271" from-port="2" to-layer="7272" to-port="0" /> + <edge from-layer="7272" from-port="2" to-layer="7273" to-port="1" /> + <edge from-layer="7273" from-port="2" to-layer="7322" to-port="0" /> + <edge from-layer="7273" from-port="2" to-layer="7286" to-port="0" /> + <edge from-layer="7274" from-port="0" to-layer="7300" to-port="0" /> + <edge from-layer="7275" from-port="0" to-layer="7294" to-port="0" /> + <edge from-layer="7276" from-port="0" to-layer="7298" to-port="1" /> + <edge from-layer="7276" from-port="0" to-layer="7294" to-port="1" /> + <edge from-layer="7277" from-port="1" to-layer="7280" to-port="0" /> + <edge from-layer="7278" from-port="0" to-layer="7280" to-port="1" /> + <edge from-layer="7279" from-port="0" to-layer="7280" to-port="2" /> + <edge from-layer="7280" from-port="3" to-layer="7285" to-port="0" /> + <edge from-layer="7281" from-port="1" to-layer="7284" to-port="0" /> + <edge from-layer="7282" from-port="0" to-layer="7284" to-port="1" /> + <edge from-layer="7283" from-port="0" to-layer="7284" to-port="2" /> + <edge from-layer="7284" from-port="3" to-layer="7285" to-port="1" /> + <edge from-layer="7285" from-port="2" to-layer="7290" to-port="0" /> + <edge from-layer="7285" from-port="2" to-layer="7297" to-port="0" /> + <edge from-layer="7286" from-port="1" to-layer="7289" to-port="0" /> + <edge from-layer="7286" from-port="1" to-layer="7315" to-port="0" /> + <edge from-layer="7287" from-port="0" to-layer="7289" to-port="1" /> + <edge from-layer="7288" from-port="0" to-layer="7289" to-port="2" /> + <edge from-layer="7289" from-port="3" to-layer="7290" to-port="1" /> + <edge from-layer="7290" from-port="2" to-layer="7292" to-port="0" /> + <edge from-layer="7291" from-port="0" to-layer="7292" to-port="1" /> + <edge from-layer="7292" from-port="2" to-layer="7294" to-port="2" /> + <edge from-layer="7293" from-port="0" to-layer="7298" to-port="3" /> + <edge from-layer="7293" from-port="0" to-layer="7294" to-port="3" /> + <edge from-layer="7294" from-port="4" to-layer="7300" to-port="1" /> + <edge from-layer="7295" from-port="0" to-layer="7298" to-port="0" /> + <edge from-layer="7296" from-port="0" to-layer="7297" to-port="1" /> + <edge from-layer="7297" from-port="2" to-layer="7305" to-port="2" /> + <edge from-layer="7297" from-port="2" to-layer="7298" to-port="2" /> + <edge from-layer="7298" from-port="4" to-layer="7300" to-port="2" /> + <edge from-layer="7299" from-port="0" to-layer="7300" to-port="3" /> + <edge from-layer="7300" from-port="4" to-layer="7307" to-port="0" /> + <edge from-layer="7301" from-port="0" to-layer="7307" to-port="1" /> + <edge from-layer="7302" from-port="0" to-layer="7305" to-port="0" /> + <edge from-layer="7303" from-port="0" to-layer="7305" to-port="1" /> + <edge from-layer="7304" from-port="0" to-layer="7305" to-port="3" /> + <edge from-layer="7305" from-port="4" to-layer="7307" to-port="2" /> + <edge from-layer="7306" from-port="0" to-layer="7307" to-port="3" /> + <edge from-layer="7307" from-port="4" to-layer="7310" to-port="0" /> + <edge from-layer="7308" from-port="0" to-layer="7310" to-port="1" /> + <edge from-layer="7309" from-port="0" to-layer="7310" to-port="2" /> + <edge from-layer="7310" from-port="3" to-layer="7311" to-port="0" /> + <edge from-layer="7311" from-port="2" to-layer="7321" to-port="0" /> + <edge from-layer="7311" from-port="2" to-layer="7312" to-port="0" /> + <edge from-layer="7312" from-port="1" to-layer="7320" to-port="0" /> + <edge from-layer="7313" from-port="0" to-layer="7315" to-port="1" /> + <edge from-layer="7314" from-port="0" to-layer="7315" to-port="2" /> + <edge from-layer="7315" from-port="3" to-layer="7319" to-port="0" /> + <edge from-layer="7316" from-port="0" to-layer="7319" to-port="1" /> + <edge from-layer="7317" from-port="0" to-layer="7319" to-port="2" /> + <edge from-layer="7318" from-port="0" to-layer="7319" to-port="3" /> + <edge from-layer="7319" from-port="4" to-layer="7320" to-port="1" /> + <edge from-layer="7320" from-port="2" to-layer="7321" to-port="1" /> + <edge from-layer="7321" from-port="2" to-layer="7322" to-port="3" /> + <edge from-layer="7322" from-port="4" to-layer="7324" to-port="0" /> + <edge from-layer="7323" from-port="0" to-layer="7324" to-port="1" /> + <edge from-layer="7324" from-port="2" to-layer="7326" to-port="0" /> + <edge from-layer="7325" from-port="0" to-layer="7326" to-port="1" /> + <edge from-layer="7326" from-port="2" to-layer="7335" to-port="0" /> + <edge from-layer="7327" from-port="0" to-layer="7328" to-port="0" /> + <edge from-layer="7328" from-port="1" to-layer="7331" to-port="0" /> + <edge from-layer="7329" from-port="0" to-layer="7330" to-port="0" /> + <edge from-layer="7330" from-port="1" to-layer="7331" to-port="1" /> + <edge from-layer="7331" from-port="2" to-layer="7333" to-port="0" /> + <edge from-layer="7332" from-port="0" to-layer="7333" to-port="1" /> + <edge from-layer="7333" from-port="2" to-layer="7334" to-port="0" /> + <edge from-layer="7334" from-port="1" to-layer="7335" to-port="1" /> + <edge from-layer="7335" from-port="2" to-layer="7337" to-port="0" /> + <edge from-layer="7336" from-port="0" to-layer="7337" to-port="1" /> + <edge from-layer="7337" from-port="2" to-layer="7338" to-port="0" /> + <edge from-layer="7338" from-port="2" to-layer="7340" to-port="0" /> + <edge from-layer="7338" from-port="2" to-layer="7368" to-port="1" /> + <edge from-layer="7339" from-port="0" to-layer="7340" to-port="1" /> + <edge from-layer="7340" from-port="2" to-layer="7342" to-port="0" /> + <edge from-layer="7341" from-port="0" to-layer="7342" to-port="1" /> + <edge from-layer="7342" from-port="2" to-layer="7344" to-port="0" /> + <edge from-layer="7343" from-port="0" to-layer="7344" to-port="1" /> + <edge from-layer="7344" from-port="2" to-layer="7353" to-port="0" /> + <edge from-layer="7345" from-port="0" to-layer="7346" to-port="0" /> + <edge from-layer="7346" from-port="1" to-layer="7349" to-port="0" /> + <edge from-layer="7347" from-port="0" to-layer="7348" to-port="0" /> + <edge from-layer="7348" from-port="1" to-layer="7349" to-port="1" /> + <edge from-layer="7349" from-port="2" to-layer="7351" to-port="0" /> + <edge from-layer="7350" from-port="0" to-layer="7351" to-port="1" /> + <edge from-layer="7351" from-port="2" to-layer="7352" to-port="0" /> + <edge from-layer="7352" from-port="1" to-layer="7353" to-port="1" /> + <edge from-layer="7353" from-port="2" to-layer="7355" to-port="0" /> + <edge from-layer="7354" from-port="0" to-layer="7355" to-port="1" /> + <edge from-layer="7355" from-port="2" to-layer="7356" to-port="0" /> + <edge from-layer="7356" from-port="1" to-layer="7365" to-port="0" /> + <edge from-layer="7357" from-port="0" to-layer="7358" to-port="0" /> + <edge from-layer="7358" from-port="1" to-layer="7361" to-port="0" /> + <edge from-layer="7359" from-port="0" to-layer="7360" to-port="0" /> + <edge from-layer="7360" from-port="1" to-layer="7361" to-port="1" /> + <edge from-layer="7361" from-port="2" to-layer="7363" to-port="0" /> + <edge from-layer="7362" from-port="0" to-layer="7363" to-port="1" /> + <edge from-layer="7363" from-port="2" to-layer="7364" to-port="0" /> + <edge from-layer="7364" from-port="1" to-layer="7365" to-port="1" /> + <edge from-layer="7365" from-port="2" to-layer="7367" to-port="0" /> + <edge from-layer="7366" from-port="0" to-layer="7367" to-port="1" /> + <edge from-layer="7367" from-port="2" to-layer="7368" to-port="0" /> + <edge from-layer="7368" from-port="2" to-layer="7370" to-port="0" /> + <edge from-layer="7369" from-port="0" to-layer="7370" to-port="1" /> + <edge from-layer="7370" from-port="2" to-layer="7372" to-port="0" /> + <edge from-layer="7371" from-port="0" to-layer="7372" to-port="1" /> + <edge from-layer="7372" from-port="2" to-layer="7374" to-port="0" /> + <edge from-layer="7373" from-port="0" to-layer="7374" to-port="1" /> + <edge from-layer="7374" from-port="2" to-layer="7383" to-port="0" /> + <edge from-layer="7375" from-port="0" to-layer="7376" to-port="0" /> + <edge from-layer="7376" from-port="1" to-layer="7379" to-port="0" /> + <edge from-layer="7377" from-port="0" to-layer="7378" to-port="0" /> + <edge from-layer="7378" from-port="1" to-layer="7379" to-port="1" /> + <edge from-layer="7379" from-port="2" to-layer="7381" to-port="0" /> + <edge from-layer="7380" from-port="0" to-layer="7381" to-port="1" /> + <edge from-layer="7381" from-port="2" to-layer="7382" to-port="0" /> + <edge from-layer="7382" from-port="1" to-layer="7383" to-port="1" /> + <edge from-layer="7383" from-port="2" to-layer="7384" to-port="0" /> + </edges> + <rt_info> + <Runtime_version value="2024.2.0-15519-5c0f38f83f6-releases/2024/2" /> + <conversion_parameters> + <framework value="pytorch" /> + <is_python_object value="True" /> + </conversion_parameters> + <nncf> + <friendly_names_were_updated value="True" /> + <weight_compression> + <all_layers value="False" /> + <awq value="False" /> + <gptq value="False" /> + <group_size value="-1" /> + <ignored_scope value="[]" /> + <mode value="int8_asym" /> + <ratio value="1" /> + <scale_estimation value="False" /> + <sensitivity_metric value="weight_quantization_error" /> + </weight_compression> + </nncf> + <optimum> + <nncf_version value="2.12.0.dev0+e8ea2521" /> + <optimum_intel_version value="1.18.0.dev0+0a6075b" /> + <optimum_version value="1.20.0" /> + <pytorch_version value="2.3.0" /> + <transformers_version value="4.41.2" /> + </optimum> + </rt_info> +</net>