<?xml version="1.0"?>
<net name="Model0" version="11">
<layers>
<layer id="0" name="input_features" type="Parameter" version="opset1">
<data shape="?,80,3000" element_type="f32" />
<output>
<port id="0" precision="FP32" names="input_features">
<dim>-1</dim>
<dim>80</dim>
<dim>3000</dim>
</port>
</output>
</layer>
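		<!-- Convolutional stem: conv1 (512x80x3 kernel, stride 1, pad 1) and conv2 (512x512x3,
		     stride 2, pad 1), each followed by a broadcast bias Add and an ERF-mode Gelu.
		     Together they map the [N, 80, 3000] mel input to [N, 512, 1500] features,
		     halving the temporal resolution. -->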
<layer id="1" name="self.conv1.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 80, 3" offset="0" size="491520" />
<output>
<port id="0" precision="FP32" names="self.conv1.weight">
<dim>512</dim>
<dim>80</dim>
<dim>3</dim>
</port>
</output>
</layer>
<layer id="2" name="__module.conv1/aten::_convolution/Convolution" type="Convolution" version="opset1">
<data strides="1" dilations="1" pads_begin="1" pads_end="1" auto_pad="explicit" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>80</dim>
<dim>3000</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>80</dim>
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>3000</dim>
</port>
</output>
</layer>
<layer id="3" name="__module.conv1/aten::_convolution/Reshape" type="Const" version="opset1">
<data element_type="f32" shape="1, 512, 1" offset="491520" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>512</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="4" name="__module.conv1/aten::_convolution/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>3000</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>512</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="53">
<dim>-1</dim>
<dim>512</dim>
<dim>3000</dim>
</port>
</output>
</layer>
<layer id="5" name="aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>3000</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="21">
<dim>-1</dim>
<dim>512</dim>
<dim>3000</dim>
</port>
</output>
</layer>
<layer id="6" name="self.conv2.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512, 3" offset="493568" size="3145728" />
<output>
<port id="0" precision="FP32" names="self.conv2.weight">
<dim>512</dim>
<dim>512</dim>
<dim>3</dim>
</port>
</output>
</layer>
<layer id="7" name="__module.conv2/aten::_convolution/Convolution" type="Convolution" version="opset1">
<data strides="2" dilations="1" pads_begin="1" pads_end="1" auto_pad="explicit" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>3000</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>1500</dim>
</port>
</output>
</layer>
<layer id="8" name="__module.conv2/aten::_convolution/Reshape" type="Const" version="opset1">
<data element_type="f32" shape="1, 512, 1" offset="3639296" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>512</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="9" name="__module.conv2/aten::_convolution/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>1500</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>512</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="65">
<dim>-1</dim>
<dim>512</dim>
<dim>1500</dim>
</port>
</output>
</layer>
<layer id="10" name="aten::gelu/Gelu_1" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>1500</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="24,inputs_embeds.1">
<dim>-1</dim>
<dim>512</dim>
<dim>1500</dim>
</port>
</output>
</layer>
<layer id="11" name="Constant_120" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="3641344" size="24" />
<output>
<port id="0" precision="I64" names="28">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="12" name="aten::permute/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>512</dim>
<dim>1500</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="29,inputs_embeds">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="13" name="Constant_5893" type="Const" version="opset1">
<data element_type="f32" shape="1, 1500, 512" offset="3641368" size="3072000" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="14" name="aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="31,input.1">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
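		<!-- aten::permute moves channels last, [N, 512, 1500] to [N, 1500, 512] (permutation
		     order read from the .bin at offset 3641344), and Constant_5893 (1x1500x512) holds
		     the encoder positional embedding that is broadcast-added to every batch item. -->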
<layer id="15" name="__module.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="16" name="__module.layers.0.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="17" name="Constant_5894" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="6713372" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="18" name="__module.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="19" name="Constant_5895" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="6715420" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="20" name="__module.layers.0.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="88,hidden_states.1">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
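		<!-- LayerNorm is decomposed in the IR: MVN (mean/variance normalization, eps ~1e-05,
		     INSIDE_SQRT; the reduction axis is read from the .bin at offset 6713368) followed
		     by a broadcast Multiply with the gamma weight and an Add with the beta bias.
		     The same three-op pattern precedes every attention block (self_attn_layer_norm)
		     and every MLP (final_layer_norm). -->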
<layer id="21" name="self.layers.0.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="6717468" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.0.self_attn.q_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="22" name="__module.layers.0.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="23" name="Constant_5896" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="7766044" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="24" name="__module.layers.0.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="97,tensor.1">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="25" name="Constant_6056" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="26" name="__module.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="99">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="27" name="__module.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="28" name="__module.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="100">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="29" name="self.layers.0.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="7768140" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.0.self_attn.k_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="30" name="__module.layers.0.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="103,tensor.3">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="31" name="Constant_6057" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="32" name="__module.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="105">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="33" name="__module.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="34" name="__module.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="106">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="35" name="self.layers.0.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="8816716" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.0.self_attn.v_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="36" name="__module.layers.0.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="37" name="Constant_5897" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="9865292" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="38" name="__module.layers.0.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="110,tensor.5">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="39" name="Constant_6058" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="40" name="__module.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="112">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="41" name="__module.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="42" name="__module.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="113">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="43" name="__module.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="115,attn_output.1">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
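		<!-- ScaledDotProductAttention (opset13, causal=false) takes Q, K, V of shape
		     [N, 8, 1500, 64] and computes softmax(Q K^T / sqrt(64)) V per head; no attention
		     mask is wired in, so all 1500 encoder positions attend to each other. The
		     surrounding Reshape/Transpose pairs split the 512-dim projections into 8 heads
		     of 64 and merge them back afterwards. -->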
<layer id="44" name="__module.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="45" name="__module.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="116,attn_output.3">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="46" name="Constant_6059" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="9867340" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="47" name="__module.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="118">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="48" name="self.layers.0.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="9867364" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.0.self_attn.out_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="49" name="__module.layers.0.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="50" name="Constant_5898" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="10915940" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="51" name="__module.layers.0.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="121,input.3">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="52" name="__module.layers.0/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="123,residual.3">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="53" name="__module.layers.0.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="54" name="__module.layers.0.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="55" name="Constant_5899" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="10917988" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="56" name="__module.layers.0.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="57" name="Constant_5900" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="10920036" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="58" name="__module.layers.0.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="127">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="59" name="self.layers.0.fc1.weight" type="Const" version="opset1">
<data element_type="f32" shape="2048, 512" offset="10922084" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.0.fc1.weight">
<dim>2048</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="60" name="__module.layers.0.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>2048</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="61" name="Constant_5901" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 2048" offset="15116388" size="8192" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="62" name="__module.layers.0.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="130">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="63" name="__module.layers.0.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="131,input.5">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="64" name="self.layers.0.fc2.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 2048" offset="15124580" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.0.fc2.weight">
<dim>512</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="65" name="__module.layers.0.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="66" name="Constant_5902" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="19318884" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="67" name="__module.layers.0.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="135,input.7">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="68" name="__module.layers.0/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="137,residual.5">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
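		<!-- End of encoder layer 0. Every __module.layers.N block repeats this pre-norm
		     pattern: self_attn_layer_norm, 8-head self-attention with an output projection
		     and a residual Add, then final_layer_norm and an fc1 (512 to 2048), Gelu,
		     fc2 (2048 to 512) MLP with a second residual Add. The layers differ only in
		     the weight constants they read from the .bin. -->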
<layer id="69" name="__module.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="70" name="__module.layers.1.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="71" name="Constant_5903" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="19320932" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="72" name="__module.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="73" name="Constant_5904" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="19322980" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="74" name="__module.layers.1.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="160,hidden_states.7">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="75" name="self.layers.1.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="19325028" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.1.self_attn.q_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="76" name="__module.layers.1.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="77" name="Constant_5905" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="20373604" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="78" name="__module.layers.1.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="169,tensor.7">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="79" name="Constant_6060" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="80" name="__module.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="171">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="81" name="__module.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="82" name="__module.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="172">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="83" name="self.layers.1.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="20375652" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.1.self_attn.k_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="84" name="__module.layers.1.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="175,tensor.9">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="85" name="Constant_6061" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="86" name="__module.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="177">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="87" name="__module.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="88" name="__module.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="178">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="89" name="self.layers.1.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="21424228" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.1.self_attn.v_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="90" name="__module.layers.1.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="91" name="Constant_5906" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="22472804" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="92" name="__module.layers.1.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="182,tensor.11">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="93" name="Constant_6062" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="94" name="__module.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="184">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="95" name="__module.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="96" name="__module.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="185">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="97" name="__module.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="187,attn_output.5">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="98" name="__module.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="99" name="__module.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="188,attn_output.7">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="100" name="Constant_6063" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="9867340" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="101" name="__module.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="190">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="102" name="self.layers.1.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="22474852" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.1.self_attn.out_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="103" name="__module.layers.1.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="104" name="Constant_5907" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="23523428" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="105" name="__module.layers.1.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="193,input.9">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="106" name="__module.layers.1/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="195,residual.7">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="107" name="__module.layers.1.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="108" name="__module.layers.1.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="109" name="Constant_5908" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="23525476" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="110" name="__module.layers.1.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="111" name="Constant_5909" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="23527524" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="112" name="__module.layers.1.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="199">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="113" name="self.layers.1.fc1.weight" type="Const" version="opset1">
<data element_type="f32" shape="2048, 512" offset="23529572" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.1.fc1.weight">
<dim>2048</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="114" name="__module.layers.1.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>2048</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="115" name="Constant_5910" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 2048" offset="27723876" size="8192" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="116" name="__module.layers.1.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="202">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="117" name="__module.layers.1.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="203,input.11">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="118" name="self.layers.1.fc2.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 2048" offset="27732068" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.1.fc2.weight">
<dim>512</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="119" name="__module.layers.1.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="120" name="Constant_5911" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="31926372" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="121" name="__module.layers.1.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="207,input.13">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="122" name="__module.layers.1/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="209,residual.9">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="123" name="__module.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="124" name="__module.layers.2.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="125" name="Constant_5912" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="31928420" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="126" name="__module.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="127" name="Constant_5913" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="31930468" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="128" name="__module.layers.2.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="232,hidden_states.13">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="129" name="self.layers.2.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="31932516" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.2.self_attn.q_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="130" name="__module.layers.2.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="131" name="Constant_5914" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="32981092" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="132" name="__module.layers.2.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="241,tensor.13">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="133" name="Constant_6064" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="134" name="__module.layers.2.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="243">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="135" name="__module.layers.2.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="136" name="__module.layers.2.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="244">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="137" name="self.layers.2.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="32983140" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.2.self_attn.k_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="138" name="__module.layers.2.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="247,tensor.15">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="139" name="Constant_6065" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="140" name="__module.layers.2.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="249">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="141" name="__module.layers.2.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="142" name="__module.layers.2.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="250">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="143" name="self.layers.2.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="34031716" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.2.self_attn.v_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="144" name="__module.layers.2.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="145" name="Constant_5915" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="35080292" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="146" name="__module.layers.2.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="254,tensor.17">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="147" name="Constant_6066" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="148" name="__module.layers.2.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="256">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="149" name="__module.layers.2.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="150" name="__module.layers.2.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="257">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="151" name="__module.layers.2.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="259,attn_output.9">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="152" name="__module.layers.2.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="153" name="__module.layers.2.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="260,attn_output.11">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="154" name="Constant_6067" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="9867340" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="155" name="__module.layers.2.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="262">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="156" name="self.layers.2.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="35082340" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.2.self_attn.out_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="157" name="__module.layers.2.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="158" name="Constant_5916" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="36130916" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="159" name="__module.layers.2.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="265,input.15">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="160" name="__module.layers.2/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="267,residual.11">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="161" name="__module.layers.2.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="162" name="__module.layers.2.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="163" name="Constant_5917" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="36132964" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="164" name="__module.layers.2.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="165" name="Constant_5918" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="36135012" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="166" name="__module.layers.2.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="271">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="167" name="self.layers.2.fc1.weight" type="Const" version="opset1">
<data element_type="f32" shape="2048, 512" offset="36137060" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.2.fc1.weight">
<dim>2048</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="168" name="__module.layers.2.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>2048</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="169" name="Constant_5919" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 2048" offset="40331364" size="8192" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="170" name="__module.layers.2.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="274">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="171" name="__module.layers.2.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="275,input.17">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="172" name="self.layers.2.fc2.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 2048" offset="40339556" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.2.fc2.weight">
<dim>512</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="173" name="__module.layers.2.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="174" name="Constant_5920" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="44533860" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="175" name="__module.layers.2.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="279,input.19">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="176" name="__module.layers.2/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="281,residual.13">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="177" name="__module.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="178" name="__module.layers.3.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="179" name="Constant_5921" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="44535908" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="180" name="__module.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="181" name="Constant_5922" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="44537956" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="182" name="__module.layers.3.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="304,hidden_states.19">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="183" name="self.layers.3.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="44540004" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.3.self_attn.q_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="184" name="__module.layers.3.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="185" name="Constant_5923" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="45588580" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="186" name="__module.layers.3.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="313,tensor.19">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="187" name="Constant_6068" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="188" name="__module.layers.3.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="315">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="189" name="__module.layers.3.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="190" name="__module.layers.3.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="316">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="191" name="self.layers.3.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="45590628" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.3.self_attn.k_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="192" name="__module.layers.3.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="319,tensor.21">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="193" name="Constant_6069" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="194" name="__module.layers.3.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="321">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="195" name="__module.layers.3.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="196" name="__module.layers.3.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="322">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="197" name="self.layers.3.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="46639204" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.3.self_attn.v_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="198" name="__module.layers.3.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="199" name="Constant_5924" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="47687780" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="200" name="__module.layers.3.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="326,tensor.23">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="201" name="Constant_6070" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="202" name="__module.layers.3.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="328">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="203" name="__module.layers.3.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="204" name="__module.layers.3.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="329">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="205" name="__module.layers.3.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="331,attn_output.13">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="206" name="__module.layers.3.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="207" name="__module.layers.3.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="332,attn_output.15">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="208" name="Constant_6071" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="9867340" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="209" name="__module.layers.3.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="334">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="210" name="self.layers.3.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="47689828" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.3.self_attn.out_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="211" name="__module.layers.3.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="212" name="Constant_5925" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="48738404" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="213" name="__module.layers.3.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="337,input.21">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="214" name="__module.layers.3/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="339,residual.15">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="215" name="__module.layers.3.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="216" name="__module.layers.3.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="217" name="Constant_5926" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="48740452" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="218" name="__module.layers.3.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="219" name="Constant_5927" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="48742500" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="220" name="__module.layers.3.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="343">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="221" name="self.layers.3.fc1.weight" type="Const" version="opset1">
<data element_type="f32" shape="2048, 512" offset="48744548" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.3.fc1.weight">
<dim>2048</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="222" name="__module.layers.3.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>2048</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="223" name="Constant_5928" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 2048" offset="52938852" size="8192" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="224" name="__module.layers.3.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="346">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="225" name="__module.layers.3.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="347,input.23">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="226" name="self.layers.3.fc2.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 2048" offset="52947044" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.3.fc2.weight">
<dim>512</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="227" name="__module.layers.3.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="228" name="Constant_5929" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="57141348" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="229" name="__module.layers.3.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="351,input.25">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="230" name="__module.layers.3/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="353,residual.17">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="231" name="__module.layers.4.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="232" name="__module.layers.4.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="233" name="Constant_5930" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="57143396" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="234" name="__module.layers.4.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="235" name="Constant_5931" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="57145444" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="236" name="__module.layers.4.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="376,hidden_states.25">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="237" name="self.layers.4.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="57147492" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.4.self_attn.q_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="238" name="__module.layers.4.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="239" name="Constant_5932" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="58196068" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="240" name="__module.layers.4.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="385,tensor.25">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="241" name="Constant_6072" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="242" name="__module.layers.4.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="387">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="243" name="__module.layers.4.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="244" name="__module.layers.4.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="388">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="245" name="self.layers.4.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="58198116" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.4.self_attn.k_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="246" name="__module.layers.4.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="391,tensor.27">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="247" name="Constant_6073" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="248" name="__module.layers.4.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="393">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="249" name="__module.layers.4.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="250" name="__module.layers.4.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="394">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="251" name="self.layers.4.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="59246692" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.4.self_attn.v_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="252" name="__module.layers.4.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="253" name="Constant_5933" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="60295268" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="254" name="__module.layers.4.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="398,tensor.29">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="255" name="Constant_6074" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="256" name="__module.layers.4.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="400">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="257" name="__module.layers.4.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="258" name="__module.layers.4.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="401">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="259" name="__module.layers.4.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="403,attn_output.17">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="260" name="__module.layers.4.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="261" name="__module.layers.4.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="404,attn_output.19">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="262" name="Constant_6075" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="9867340" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="263" name="__module.layers.4.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="406">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="264" name="self.layers.4.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="60297316" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.4.self_attn.out_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="265" name="__module.layers.4.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="266" name="Constant_5934" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="61345892" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="267" name="__module.layers.4.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="409,input.27">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="268" name="__module.layers.4/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="411,residual.19">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="269" name="__module.layers.4.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="270" name="__module.layers.4.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="271" name="Constant_5935" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="61347940" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="272" name="__module.layers.4.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="273" name="Constant_5936" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="61349988" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="274" name="__module.layers.4.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="415">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="275" name="self.layers.4.fc1.weight" type="Const" version="opset1">
<data element_type="f32" shape="2048, 512" offset="61352036" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.4.fc1.weight">
<dim>2048</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="276" name="__module.layers.4.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>2048</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="277" name="Constant_5937" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 2048" offset="65546340" size="8192" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="278" name="__module.layers.4.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="418">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="279" name="__module.layers.4.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="419,input.29">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="280" name="self.layers.4.fc2.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 2048" offset="65554532" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.4.fc2.weight">
<dim>512</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="281" name="__module.layers.4.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="282" name="Constant_5938" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="69748836" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="283" name="__module.layers.4.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="423,input.31">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="284" name="__module.layers.4/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="425,residual.21">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="285" name="__module.layers.5.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="286" name="__module.layers.5.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="287" name="Constant_5939" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="69750884" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="288" name="__module.layers.5.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="289" name="Constant_5940" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="69752932" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="290" name="__module.layers.5.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="448,hidden_states.31">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="291" name="self.layers.5.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="69754980" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.5.self_attn.q_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="292" name="__module.layers.5.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="293" name="Constant_5941" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="70803556" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="294" name="__module.layers.5.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="457,tensor.31">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="295" name="Constant_6076" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="296" name="__module.layers.5.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="459">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="297" name="__module.layers.5.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="298" name="__module.layers.5.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="460">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="299" name="self.layers.5.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="70805604" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.5.self_attn.k_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="300" name="__module.layers.5.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="463,tensor.33">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="301" name="Constant_6077" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="302" name="__module.layers.5.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="465">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="303" name="__module.layers.5.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="304" name="__module.layers.5.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="466">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="305" name="self.layers.5.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="71854180" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.5.self_attn.v_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="306" name="__module.layers.5.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="307" name="Constant_5942" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="72902756" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="308" name="__module.layers.5.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="470,tensor">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="309" name="Constant_6078" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="7768092" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="310" name="__module.layers.5.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="472">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="311" name="__module.layers.5.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="312" name="__module.layers.5.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="473">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="313" name="__module.layers.5.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="475,attn_output.21">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="314" name="__module.layers.5.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="7768124" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="315" name="__module.layers.5.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>8</dim>
<dim>1500</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="476,attn_output">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="316" name="Constant_6079" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="9867340" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="317" name="__module.layers.5.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>8</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="478">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="318" name="self.layers.5.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 512" offset="72904804" size="1048576" />
<output>
<port id="0" precision="FP32" names="self.layers.5.self_attn.out_proj.weight">
<dim>512</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="319" name="__module.layers.5.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="320" name="Constant_5943" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="73953380" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="321" name="__module.layers.5.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="481,input.33">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="322" name="__module.layers.5/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="483,residual">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="323" name="__module.layers.5.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="324" name="__module.layers.5.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="325" name="Constant_5944" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="73955428" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="326" name="__module.layers.5.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="327" name="Constant_5945" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="73957476" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="328" name="__module.layers.5.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="487">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="329" name="self.layers.5.fc1.weight" type="Const" version="opset1">
<data element_type="f32" shape="2048, 512" offset="73959524" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.5.fc1.weight">
<dim>2048</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="330" name="__module.layers.5.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>2048</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="331" name="Constant_5946" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 2048" offset="78153828" size="8192" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="332" name="__module.layers.5.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="490">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="333" name="__module.layers.5.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="491,input.35">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="334" name="self.layers.5.fc2.weight" type="Const" version="opset1">
<data element_type="f32" shape="512, 2048" offset="78162020" size="4194304" />
<output>
<port id="0" precision="FP32" names="self.layers.5.fc2.weight">
<dim>512</dim>
<dim>2048</dim>
</port>
</output>
</layer>
<layer id="335" name="__module.layers.5.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>2048</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>2048</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="336" name="Constant_5947" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="82356324" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="337" name="__module.layers.5.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="495,input">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="338" name="__module.layers.5/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="497">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="339" name="__module.layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="6713368" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="340" name="__module.layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="341" name="Constant_5948" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="82358372" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="342" name="__module.layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="343" name="Constant_5949" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 512" offset="82360420" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="344" name="__module.layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>512</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="last_hidden_state">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="345" name="Result_1938" type="Result" version="opset1" output_names="last_hidden_state">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1500</dim>
<dim>512</dim>
</port>
</input>
</layer>
</layers>
<edges>
<edge from-layer="0" from-port="0" to-layer="2" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="2" to-port="1" />
<edge from-layer="2" from-port="2" to-layer="4" to-port="0" />
<edge from-layer="3" from-port="0" to-layer="4" to-port="1" />
<edge from-layer="4" from-port="2" to-layer="5" to-port="0" />
<edge from-layer="5" from-port="1" to-layer="7" to-port="0" />
<edge from-layer="6" from-port="0" to-layer="7" to-port="1" />
<edge from-layer="7" from-port="2" to-layer="9" to-port="0" />
<edge from-layer="8" from-port="0" to-layer="9" to-port="1" />
<edge from-layer="9" from-port="2" to-layer="10" to-port="0" />
<edge from-layer="10" from-port="1" to-layer="12" to-port="0" />
<edge from-layer="11" from-port="0" to-layer="12" to-port="1" />
<edge from-layer="12" from-port="2" to-layer="14" to-port="0" />
<edge from-layer="13" from-port="0" to-layer="14" to-port="1" />
<edge from-layer="14" from-port="2" to-layer="52" to-port="0" />
<edge from-layer="14" from-port="2" to-layer="16" to-port="0" />
<edge from-layer="15" from-port="0" to-layer="16" to-port="1" />
<edge from-layer="16" from-port="2" to-layer="18" to-port="0" />
<edge from-layer="17" from-port="0" to-layer="18" to-port="1" />
<edge from-layer="18" from-port="2" to-layer="20" to-port="0" />
<edge from-layer="19" from-port="0" to-layer="20" to-port="1" />
<edge from-layer="20" from-port="2" to-layer="22" to-port="0" />
<edge from-layer="20" from-port="2" to-layer="36" to-port="0" />
<edge from-layer="20" from-port="2" to-layer="30" to-port="0" />
<edge from-layer="21" from-port="0" to-layer="22" to-port="1" />
<edge from-layer="22" from-port="2" to-layer="24" to-port="0" />
<edge from-layer="23" from-port="0" to-layer="24" to-port="1" />
<edge from-layer="24" from-port="2" to-layer="26" to-port="0" />
<edge from-layer="25" from-port="0" to-layer="26" to-port="1" />
<edge from-layer="26" from-port="2" to-layer="28" to-port="0" />
<edge from-layer="27" from-port="0" to-layer="28" to-port="1" />
<edge from-layer="28" from-port="2" to-layer="43" to-port="0" />
<edge from-layer="29" from-port="0" to-layer="30" to-port="1" />
<edge from-layer="30" from-port="2" to-layer="32" to-port="0" />
<edge from-layer="31" from-port="0" to-layer="32" to-port="1" />
<edge from-layer="32" from-port="2" to-layer="34" to-port="0" />
<edge from-layer="33" from-port="0" to-layer="34" to-port="1" />
<edge from-layer="34" from-port="2" to-layer="43" to-port="1" />
<edge from-layer="35" from-port="0" to-layer="36" to-port="1" />
<edge from-layer="36" from-port="2" to-layer="38" to-port="0" />
<edge from-layer="37" from-port="0" to-layer="38" to-port="1" />
<edge from-layer="38" from-port="2" to-layer="40" to-port="0" />
<edge from-layer="39" from-port="0" to-layer="40" to-port="1" />
<edge from-layer="40" from-port="2" to-layer="42" to-port="0" />
<edge from-layer="41" from-port="0" to-layer="42" to-port="1" />
<edge from-layer="42" from-port="2" to-layer="43" to-port="2" />
<edge from-layer="43" from-port="3" to-layer="45" to-port="0" />
<edge from-layer="44" from-port="0" to-layer="45" to-port="1" />
<edge from-layer="45" from-port="2" to-layer="47" to-port="0" />
<edge from-layer="46" from-port="0" to-layer="47" to-port="1" />
<edge from-layer="47" from-port="2" to-layer="49" to-port="0" />
<edge from-layer="48" from-port="0" to-layer="49" to-port="1" />
<edge from-layer="49" from-port="2" to-layer="51" to-port="0" />
<edge from-layer="50" from-port="0" to-layer="51" to-port="1" />
<edge from-layer="51" from-port="2" to-layer="52" to-port="1" />
<edge from-layer="52" from-port="2" to-layer="54" to-port="0" />
<edge from-layer="52" from-port="2" to-layer="68" to-port="0" />
<edge from-layer="53" from-port="0" to-layer="54" to-port="1" />
<edge from-layer="54" from-port="2" to-layer="56" to-port="0" />
<edge from-layer="55" from-port="0" to-layer="56" to-port="1" />
<edge from-layer="56" from-port="2" to-layer="58" to-port="0" />
<edge from-layer="57" from-port="0" to-layer="58" to-port="1" />
<edge from-layer="58" from-port="2" to-layer="60" to-port="0" />
<edge from-layer="59" from-port="0" to-layer="60" to-port="1" />
<edge from-layer="60" from-port="2" to-layer="62" to-port="0" />
<edge from-layer="61" from-port="0" to-layer="62" to-port="1" />
<edge from-layer="62" from-port="2" to-layer="63" to-port="0" />
<edge from-layer="63" from-port="1" to-layer="65" to-port="0" />
<edge from-layer="64" from-port="0" to-layer="65" to-port="1" />
<edge from-layer="65" from-port="2" to-layer="67" to-port="0" />
<edge from-layer="66" from-port="0" to-layer="67" to-port="1" />
<edge from-layer="67" from-port="2" to-layer="68" to-port="1" />
<edge from-layer="68" from-port="2" to-layer="70" to-port="0" />
<edge from-layer="68" from-port="2" to-layer="106" to-port="0" />
<edge from-layer="69" from-port="0" to-layer="70" to-port="1" />
<edge from-layer="70" from-port="2" to-layer="72" to-port="0" />
<edge from-layer="71" from-port="0" to-layer="72" to-port="1" />
<edge from-layer="72" from-port="2" to-layer="74" to-port="0" />
<edge from-layer="73" from-port="0" to-layer="74" to-port="1" />
<edge from-layer="74" from-port="2" to-layer="84" to-port="0" />
<edge from-layer="74" from-port="2" to-layer="90" to-port="0" />
<edge from-layer="74" from-port="2" to-layer="76" to-port="0" />
<edge from-layer="75" from-port="0" to-layer="76" to-port="1" />
<edge from-layer="76" from-port="2" to-layer="78" to-port="0" />
<edge from-layer="77" from-port="0" to-layer="78" to-port="1" />
<edge from-layer="78" from-port="2" to-layer="80" to-port="0" />
<edge from-layer="79" from-port="0" to-layer="80" to-port="1" />
<edge from-layer="80" from-port="2" to-layer="82" to-port="0" />
<edge from-layer="81" from-port="0" to-layer="82" to-port="1" />
<edge from-layer="82" from-port="2" to-layer="97" to-port="0" />
<edge from-layer="83" from-port="0" to-layer="84" to-port="1" />
<edge from-layer="84" from-port="2" to-layer="86" to-port="0" />
<edge from-layer="85" from-port="0" to-layer="86" to-port="1" />
<edge from-layer="86" from-port="2" to-layer="88" to-port="0" />
<edge from-layer="87" from-port="0" to-layer="88" to-port="1" />
<edge from-layer="88" from-port="2" to-layer="97" to-port="1" />
<edge from-layer="89" from-port="0" to-layer="90" to-port="1" />
<edge from-layer="90" from-port="2" to-layer="92" to-port="0" />
<edge from-layer="91" from-port="0" to-layer="92" to-port="1" />
<edge from-layer="92" from-port="2" to-layer="94" to-port="0" />
<edge from-layer="93" from-port="0" to-layer="94" to-port="1" />
<edge from-layer="94" from-port="2" to-layer="96" to-port="0" />
<edge from-layer="95" from-port="0" to-layer="96" to-port="1" />
<edge from-layer="96" from-port="2" to-layer="97" to-port="2" />
<edge from-layer="97" from-port="3" to-layer="99" to-port="0" />
<edge from-layer="98" from-port="0" to-layer="99" to-port="1" />
<edge from-layer="99" from-port="2" to-layer="101" to-port="0" />
<edge from-layer="100" from-port="0" to-layer="101" to-port="1" />
<edge from-layer="101" from-port="2" to-layer="103" to-port="0" />
<edge from-layer="102" from-port="0" to-layer="103" to-port="1" />
<edge from-layer="103" from-port="2" to-layer="105" to-port="0" />
<edge from-layer="104" from-port="0" to-layer="105" to-port="1" />
<edge from-layer="105" from-port="2" to-layer="106" to-port="1" />
<edge from-layer="106" from-port="2" to-layer="108" to-port="0" />
<edge from-layer="106" from-port="2" to-layer="122" to-port="0" />
<edge from-layer="107" from-port="0" to-layer="108" to-port="1" />
<edge from-layer="108" from-port="2" to-layer="110" to-port="0" />
<edge from-layer="109" from-port="0" to-layer="110" to-port="1" />
<edge from-layer="110" from-port="2" to-layer="112" to-port="0" />
<edge from-layer="111" from-port="0" to-layer="112" to-port="1" />
<edge from-layer="112" from-port="2" to-layer="114" to-port="0" />
<edge from-layer="113" from-port="0" to-layer="114" to-port="1" />
<edge from-layer="114" from-port="2" to-layer="116" to-port="0" />
<edge from-layer="115" from-port="0" to-layer="116" to-port="1" />
<edge from-layer="116" from-port="2" to-layer="117" to-port="0" />
<edge from-layer="117" from-port="1" to-layer="119" to-port="0" />
<edge from-layer="118" from-port="0" to-layer="119" to-port="1" />
<edge from-layer="119" from-port="2" to-layer="121" to-port="0" />
<edge from-layer="120" from-port="0" to-layer="121" to-port="1" />
<edge from-layer="121" from-port="2" to-layer="122" to-port="1" />
<edge from-layer="122" from-port="2" to-layer="124" to-port="0" />
<edge from-layer="122" from-port="2" to-layer="160" to-port="0" />
<edge from-layer="123" from-port="0" to-layer="124" to-port="1" />
<edge from-layer="124" from-port="2" to-layer="126" to-port="0" />
<edge from-layer="125" from-port="0" to-layer="126" to-port="1" />
<edge from-layer="126" from-port="2" to-layer="128" to-port="0" />
<edge from-layer="127" from-port="0" to-layer="128" to-port="1" />
<edge from-layer="128" from-port="2" to-layer="130" to-port="0" />
<edge from-layer="128" from-port="2" to-layer="144" to-port="0" />
<edge from-layer="128" from-port="2" to-layer="138" to-port="0" />
<edge from-layer="129" from-port="0" to-layer="130" to-port="1" />
<edge from-layer="130" from-port="2" to-layer="132" to-port="0" />
<edge from-layer="131" from-port="0" to-layer="132" to-port="1" />
<edge from-layer="132" from-port="2" to-layer="134" to-port="0" />
<edge from-layer="133" from-port="0" to-layer="134" to-port="1" />
<edge from-layer="134" from-port="2" to-layer="136" to-port="0" />
<edge from-layer="135" from-port="0" to-layer="136" to-port="1" />
<edge from-layer="136" from-port="2" to-layer="151" to-port="0" />
<edge from-layer="137" from-port="0" to-layer="138" to-port="1" />
<edge from-layer="138" from-port="2" to-layer="140" to-port="0" />
<edge from-layer="139" from-port="0" to-layer="140" to-port="1" />
<edge from-layer="140" from-port="2" to-layer="142" to-port="0" />
<edge from-layer="141" from-port="0" to-layer="142" to-port="1" />
<edge from-layer="142" from-port="2" to-layer="151" to-port="1" />
<edge from-layer="143" from-port="0" to-layer="144" to-port="1" />
<edge from-layer="144" from-port="2" to-layer="146" to-port="0" />
<edge from-layer="145" from-port="0" to-layer="146" to-port="1" />
<edge from-layer="146" from-port="2" to-layer="148" to-port="0" />
<edge from-layer="147" from-port="0" to-layer="148" to-port="1" />
<edge from-layer="148" from-port="2" to-layer="150" to-port="0" />
<edge from-layer="149" from-port="0" to-layer="150" to-port="1" />
<edge from-layer="150" from-port="2" to-layer="151" to-port="2" />
<edge from-layer="151" from-port="3" to-layer="153" to-port="0" />
<edge from-layer="152" from-port="0" to-layer="153" to-port="1" />
<edge from-layer="153" from-port="2" to-layer="155" to-port="0" />
<edge from-layer="154" from-port="0" to-layer="155" to-port="1" />
<edge from-layer="155" from-port="2" to-layer="157" to-port="0" />
<edge from-layer="156" from-port="0" to-layer="157" to-port="1" />
<edge from-layer="157" from-port="2" to-layer="159" to-port="0" />
<edge from-layer="158" from-port="0" to-layer="159" to-port="1" />
<edge from-layer="159" from-port="2" to-layer="160" to-port="1" />
<edge from-layer="160" from-port="2" to-layer="176" to-port="0" />
<edge from-layer="160" from-port="2" to-layer="162" to-port="0" />
<edge from-layer="161" from-port="0" to-layer="162" to-port="1" />
<edge from-layer="162" from-port="2" to-layer="164" to-port="0" />
<edge from-layer="163" from-port="0" to-layer="164" to-port="1" />
<edge from-layer="164" from-port="2" to-layer="166" to-port="0" />
<edge from-layer="165" from-port="0" to-layer="166" to-port="1" />
<edge from-layer="166" from-port="2" to-layer="168" to-port="0" />
<edge from-layer="167" from-port="0" to-layer="168" to-port="1" />
<edge from-layer="168" from-port="2" to-layer="170" to-port="0" />
<edge from-layer="169" from-port="0" to-layer="170" to-port="1" />
<edge from-layer="170" from-port="2" to-layer="171" to-port="0" />
<edge from-layer="171" from-port="1" to-layer="173" to-port="0" />
<edge from-layer="172" from-port="0" to-layer="173" to-port="1" />
<edge from-layer="173" from-port="2" to-layer="175" to-port="0" />
<edge from-layer="174" from-port="0" to-layer="175" to-port="1" />
<edge from-layer="175" from-port="2" to-layer="176" to-port="1" />
<edge from-layer="176" from-port="2" to-layer="178" to-port="0" />
<edge from-layer="176" from-port="2" to-layer="214" to-port="0" />
<edge from-layer="177" from-port="0" to-layer="178" to-port="1" />
<edge from-layer="178" from-port="2" to-layer="180" to-port="0" />
<edge from-layer="179" from-port="0" to-layer="180" to-port="1" />
<edge from-layer="180" from-port="2" to-layer="182" to-port="0" />
<edge from-layer="181" from-port="0" to-layer="182" to-port="1" />
<edge from-layer="182" from-port="2" to-layer="198" to-port="0" />
<edge from-layer="182" from-port="2" to-layer="192" to-port="0" />
<edge from-layer="182" from-port="2" to-layer="184" to-port="0" />
<edge from-layer="183" from-port="0" to-layer="184" to-port="1" />
<edge from-layer="184" from-port="2" to-layer="186" to-port="0" />
<edge from-layer="185" from-port="0" to-layer="186" to-port="1" />
<edge from-layer="186" from-port="2" to-layer="188" to-port="0" />
<edge from-layer="187" from-port="0" to-layer="188" to-port="1" />
<edge from-layer="188" from-port="2" to-layer="190" to-port="0" />
<edge from-layer="189" from-port="0" to-layer="190" to-port="1" />
<edge from-layer="190" from-port="2" to-layer="205" to-port="0" />
<edge from-layer="191" from-port="0" to-layer="192" to-port="1" />
<edge from-layer="192" from-port="2" to-layer="194" to-port="0" />
<edge from-layer="193" from-port="0" to-layer="194" to-port="1" />
<edge from-layer="194" from-port="2" to-layer="196" to-port="0" />
<edge from-layer="195" from-port="0" to-layer="196" to-port="1" />
<edge from-layer="196" from-port="2" to-layer="205" to-port="1" />
<edge from-layer="197" from-port="0" to-layer="198" to-port="1" />
<edge from-layer="198" from-port="2" to-layer="200" to-port="0" />
<edge from-layer="199" from-port="0" to-layer="200" to-port="1" />
<edge from-layer="200" from-port="2" to-layer="202" to-port="0" />
<edge from-layer="201" from-port="0" to-layer="202" to-port="1" />
<edge from-layer="202" from-port="2" to-layer="204" to-port="0" />
<edge from-layer="203" from-port="0" to-layer="204" to-port="1" />
<edge from-layer="204" from-port="2" to-layer="205" to-port="2" />
<edge from-layer="205" from-port="3" to-layer="207" to-port="0" />
<edge from-layer="206" from-port="0" to-layer="207" to-port="1" />
<edge from-layer="207" from-port="2" to-layer="209" to-port="0" />
<edge from-layer="208" from-port="0" to-layer="209" to-port="1" />
<edge from-layer="209" from-port="2" to-layer="211" to-port="0" />
<edge from-layer="210" from-port="0" to-layer="211" to-port="1" />
<edge from-layer="211" from-port="2" to-layer="213" to-port="0" />
<edge from-layer="212" from-port="0" to-layer="213" to-port="1" />
<edge from-layer="213" from-port="2" to-layer="214" to-port="1" />
<edge from-layer="214" from-port="2" to-layer="216" to-port="0" />
<edge from-layer="214" from-port="2" to-layer="230" to-port="0" />
<edge from-layer="215" from-port="0" to-layer="216" to-port="1" />
<edge from-layer="216" from-port="2" to-layer="218" to-port="0" />
<edge from-layer="217" from-port="0" to-layer="218" to-port="1" />
<edge from-layer="218" from-port="2" to-layer="220" to-port="0" />
<edge from-layer="219" from-port="0" to-layer="220" to-port="1" />
<edge from-layer="220" from-port="2" to-layer="222" to-port="0" />
<edge from-layer="221" from-port="0" to-layer="222" to-port="1" />
<edge from-layer="222" from-port="2" to-layer="224" to-port="0" />
<edge from-layer="223" from-port="0" to-layer="224" to-port="1" />
<edge from-layer="224" from-port="2" to-layer="225" to-port="0" />
<edge from-layer="225" from-port="1" to-layer="227" to-port="0" />
<edge from-layer="226" from-port="0" to-layer="227" to-port="1" />
<edge from-layer="227" from-port="2" to-layer="229" to-port="0" />
<edge from-layer="228" from-port="0" to-layer="229" to-port="1" />
<edge from-layer="229" from-port="2" to-layer="230" to-port="1" />
<edge from-layer="230" from-port="2" to-layer="268" to-port="0" />
<edge from-layer="230" from-port="2" to-layer="232" to-port="0" />
<edge from-layer="231" from-port="0" to-layer="232" to-port="1" />
<edge from-layer="232" from-port="2" to-layer="234" to-port="0" />
<edge from-layer="233" from-port="0" to-layer="234" to-port="1" />
<edge from-layer="234" from-port="2" to-layer="236" to-port="0" />
<edge from-layer="235" from-port="0" to-layer="236" to-port="1" />
<edge from-layer="236" from-port="2" to-layer="252" to-port="0" />
<edge from-layer="236" from-port="2" to-layer="238" to-port="0" />
<edge from-layer="236" from-port="2" to-layer="246" to-port="0" />
<edge from-layer="237" from-port="0" to-layer="238" to-port="1" />
<edge from-layer="238" from-port="2" to-layer="240" to-port="0" />
<edge from-layer="239" from-port="0" to-layer="240" to-port="1" />
<edge from-layer="240" from-port="2" to-layer="242" to-port="0" />
<edge from-layer="241" from-port="0" to-layer="242" to-port="1" />
<edge from-layer="242" from-port="2" to-layer="244" to-port="0" />
<edge from-layer="243" from-port="0" to-layer="244" to-port="1" />
<edge from-layer="244" from-port="2" to-layer="259" to-port="0" />
<edge from-layer="245" from-port="0" to-layer="246" to-port="1" />
<edge from-layer="246" from-port="2" to-layer="248" to-port="0" />
<edge from-layer="247" from-port="0" to-layer="248" to-port="1" />
<edge from-layer="248" from-port="2" to-layer="250" to-port="0" />
<edge from-layer="249" from-port="0" to-layer="250" to-port="1" />
<edge from-layer="250" from-port="2" to-layer="259" to-port="1" />
<edge from-layer="251" from-port="0" to-layer="252" to-port="1" />
<edge from-layer="252" from-port="2" to-layer="254" to-port="0" />
<edge from-layer="253" from-port="0" to-layer="254" to-port="1" />
<edge from-layer="254" from-port="2" to-layer="256" to-port="0" />
<edge from-layer="255" from-port="0" to-layer="256" to-port="1" />
<edge from-layer="256" from-port="2" to-layer="258" to-port="0" />
<edge from-layer="257" from-port="0" to-layer="258" to-port="1" />
<edge from-layer="258" from-port="2" to-layer="259" to-port="2" />
<edge from-layer="259" from-port="3" to-layer="261" to-port="0" />
<edge from-layer="260" from-port="0" to-layer="261" to-port="1" />
<edge from-layer="261" from-port="2" to-layer="263" to-port="0" />
<edge from-layer="262" from-port="0" to-layer="263" to-port="1" />
<edge from-layer="263" from-port="2" to-layer="265" to-port="0" />
<edge from-layer="264" from-port="0" to-layer="265" to-port="1" />
<edge from-layer="265" from-port="2" to-layer="267" to-port="0" />
<edge from-layer="266" from-port="0" to-layer="267" to-port="1" />
<edge from-layer="267" from-port="2" to-layer="268" to-port="1" />
<edge from-layer="268" from-port="2" to-layer="284" to-port="0" />
<edge from-layer="268" from-port="2" to-layer="270" to-port="0" />
<edge from-layer="269" from-port="0" to-layer="270" to-port="1" />
<edge from-layer="270" from-port="2" to-layer="272" to-port="0" />
<edge from-layer="271" from-port="0" to-layer="272" to-port="1" />
<edge from-layer="272" from-port="2" to-layer="274" to-port="0" />
<edge from-layer="273" from-port="0" to-layer="274" to-port="1" />
<edge from-layer="274" from-port="2" to-layer="276" to-port="0" />
<edge from-layer="275" from-port="0" to-layer="276" to-port="1" />
<edge from-layer="276" from-port="2" to-layer="278" to-port="0" />
<edge from-layer="277" from-port="0" to-layer="278" to-port="1" />
<edge from-layer="278" from-port="2" to-layer="279" to-port="0" />
<edge from-layer="279" from-port="1" to-layer="281" to-port="0" />
<edge from-layer="280" from-port="0" to-layer="281" to-port="1" />
<edge from-layer="281" from-port="2" to-layer="283" to-port="0" />
<edge from-layer="282" from-port="0" to-layer="283" to-port="1" />
<edge from-layer="283" from-port="2" to-layer="284" to-port="1" />
<edge from-layer="284" from-port="2" to-layer="286" to-port="0" />
<edge from-layer="284" from-port="2" to-layer="322" to-port="0" />
<edge from-layer="285" from-port="0" to-layer="286" to-port="1" />
<edge from-layer="286" from-port="2" to-layer="288" to-port="0" />
<edge from-layer="287" from-port="0" to-layer="288" to-port="1" />
<edge from-layer="288" from-port="2" to-layer="290" to-port="0" />
<edge from-layer="289" from-port="0" to-layer="290" to-port="1" />
<edge from-layer="290" from-port="2" to-layer="306" to-port="0" />
<edge from-layer="290" from-port="2" to-layer="300" to-port="0" />
<edge from-layer="290" from-port="2" to-layer="292" to-port="0" />
<edge from-layer="291" from-port="0" to-layer="292" to-port="1" />
<edge from-layer="292" from-port="2" to-layer="294" to-port="0" />
<edge from-layer="293" from-port="0" to-layer="294" to-port="1" />
<edge from-layer="294" from-port="2" to-layer="296" to-port="0" />
<edge from-layer="295" from-port="0" to-layer="296" to-port="1" />
<edge from-layer="296" from-port="2" to-layer="298" to-port="0" />
<edge from-layer="297" from-port="0" to-layer="298" to-port="1" />
<edge from-layer="298" from-port="2" to-layer="313" to-port="0" />
<edge from-layer="299" from-port="0" to-layer="300" to-port="1" />
<edge from-layer="300" from-port="2" to-layer="302" to-port="0" />
<edge from-layer="301" from-port="0" to-layer="302" to-port="1" />
<edge from-layer="302" from-port="2" to-layer="304" to-port="0" />
<edge from-layer="303" from-port="0" to-layer="304" to-port="1" />
<edge from-layer="304" from-port="2" to-layer="313" to-port="1" />
<edge from-layer="305" from-port="0" to-layer="306" to-port="1" />
<edge from-layer="306" from-port="2" to-layer="308" to-port="0" />
<edge from-layer="307" from-port="0" to-layer="308" to-port="1" />
<edge from-layer="308" from-port="2" to-layer="310" to-port="0" />
<edge from-layer="309" from-port="0" to-layer="310" to-port="1" />
<edge from-layer="310" from-port="2" to-layer="312" to-port="0" />
<edge from-layer="311" from-port="0" to-layer="312" to-port="1" />
<edge from-layer="312" from-port="2" to-layer="313" to-port="2" />
<edge from-layer="313" from-port="3" to-layer="315" to-port="0" />
<edge from-layer="314" from-port="0" to-layer="315" to-port="1" />
<edge from-layer="315" from-port="2" to-layer="317" to-port="0" />
<edge from-layer="316" from-port="0" to-layer="317" to-port="1" />
<edge from-layer="317" from-port="2" to-layer="319" to-port="0" />
<edge from-layer="318" from-port="0" to-layer="319" to-port="1" />
<edge from-layer="319" from-port="2" to-layer="321" to-port="0" />
<edge from-layer="320" from-port="0" to-layer="321" to-port="1" />
<edge from-layer="321" from-port="2" to-layer="322" to-port="1" />
<edge from-layer="322" from-port="2" to-layer="324" to-port="0" />
<edge from-layer="322" from-port="2" to-layer="338" to-port="0" />
<edge from-layer="323" from-port="0" to-layer="324" to-port="1" />
<edge from-layer="324" from-port="2" to-layer="326" to-port="0" />
<edge from-layer="325" from-port="0" to-layer="326" to-port="1" />
<edge from-layer="326" from-port="2" to-layer="328" to-port="0" />
<edge from-layer="327" from-port="0" to-layer="328" to-port="1" />
<edge from-layer="328" from-port="2" to-layer="330" to-port="0" />
<edge from-layer="329" from-port="0" to-layer="330" to-port="1" />
<edge from-layer="330" from-port="2" to-layer="332" to-port="0" />
<edge from-layer="331" from-port="0" to-layer="332" to-port="1" />
<edge from-layer="332" from-port="2" to-layer="333" to-port="0" />
<edge from-layer="333" from-port="1" to-layer="335" to-port="0" />
<edge from-layer="334" from-port="0" to-layer="335" to-port="1" />
<edge from-layer="335" from-port="2" to-layer="337" to-port="0" />
<edge from-layer="336" from-port="0" to-layer="337" to-port="1" />
<edge from-layer="337" from-port="2" to-layer="338" to-port="1" />
<edge from-layer="338" from-port="2" to-layer="340" to-port="0" />
<edge from-layer="339" from-port="0" to-layer="340" to-port="1" />
<edge from-layer="340" from-port="2" to-layer="342" to-port="0" />
<edge from-layer="341" from-port="0" to-layer="342" to-port="1" />
<edge from-layer="342" from-port="2" to-layer="344" to-port="0" />
<edge from-layer="343" from-port="0" to-layer="344" to-port="1" />
<edge from-layer="344" from-port="2" to-layer="345" to-port="0" />
</edges>
<rt_info>
<Runtime_version value="2025.2.0-19120-87425bc78ca-releases/2025/2" />
<conversion_parameters>
<framework value="pytorch" />
<is_python_object value="True" />
</conversion_parameters>
<optimum>
<optimum_intel_version value="1.24.0.dev0+08e3008" />
<optimum_version value="1.25.3" />
<pytorch_version value="2.7.0+cpu" />
<transformers_version value="4.51.3" />
</optimum>
</rt_info>
</net>