voicescribe-whisper / openvino_decoder_model.xml
Andrewsab's picture
Voice Scribe mirror whisper from FluidInference/whisper-large-v3-turbo-int4-ov-npu@2e8fe5d17cf3
9e40266 verified
<?xml version="1.0"?>
<net name="Model3" version="11">
<layers>
<layer id="1" name="decoder_input_ids" type="Parameter" version="opset1">
<data shape="?,?" element_type="i64" />
<output>
<port id="0" precision="I64" names="input_ids">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="0" name="Parameter_27379" type="Parameter" version="opset1">
<data shape="?,?,?" element_type="f32" />
<output>
<port id="0" precision="FP32" names="encoder_hidden_states">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="2" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="0" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="3" name="Convert_934373" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="4" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="819200" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="5" name="Convert_934376" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="6" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="7" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="825600" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="8" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="9" name="Constant_934381" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="10" name="Reshape_934382" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="11" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="12" name="__module.model.model.decoder.layers.3.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="13" name="Constant_34959" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="851216" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="14" name="__module.model.model.decoder.layers.3.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="540">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="15" name="ShapeOf_35280" type="ShapeOf" version="opset3">
<data output_type="i64" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="16" name="Constant_35281" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="856336" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="17" name="Constant_35282" type="Const" version="opset1">
<data element_type="i64" shape="" offset="856336" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="18" name="Gather_35283" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="123,171,241,289,359,407,477,525,68,93">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="19" name="Constant_25155" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="856344" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="20" name="Constant_25156" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="856352" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="21" name="Constant_25157" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="856360" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="22" name="__module.model.model.decoder.layers.0.self_attn/prim::ListConstruct_1" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64">
<dim>1</dim>
</port>
<port id="3" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="4" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="23" name="__module.model.model.decoder.layers.3.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="542,value_states.29">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="24" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="25" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.3.encoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="27" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="856384" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="28" name="Convert_938672" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="29" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="1675584" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="30" name="Convert_938675" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="31" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="32" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="1681984" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="33" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="34" name="Constant_938680" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="35" name="Reshape_938681" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="36" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="37" name="__module.model.model.decoder.layers.3.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="535">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="38" name="__module.model.model.decoder.layers.3.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="537,key_states.29">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="39" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="40" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.3.encoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="42" name="self.model.model.decoder.embed_tokens.weight" type="Const" version="opset1">
<data element_type="u8" shape="51866, 1280" offset="1707584" size="66388480" />
<output>
<port id="0" precision="U8">
<dim>51866</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="43" name="Convert_895684" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U8">
<dim>51866</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>51866</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="44" name="self.model.model.decoder.embed_tokens.weight/zero_point" type="Const" version="opset1">
<data element_type="u8" shape="51866, 1" offset="68096064" size="51866" />
<output>
<port id="0" precision="U8">
<dim>51866</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="45" name="Convert_895687" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U8">
<dim>51866</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>51866</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="46" name="self.model.model.decoder.embed_tokens.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>51866</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP16">
<dim>51866</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>51866</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="47" name="self.model.model.decoder.embed_tokens.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="51866, 1" offset="68147930" size="103732" />
<output>
<port id="0" precision="FP16">
<dim>51866</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="48" name="self.model.model.decoder.embed_tokens.weight/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>51866</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP16">
<dim>51866</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>51866</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="49" name="self.model.model.decoder.embed_tokens.weight/fq_weights_0/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>51866</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>51866</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="50" name="Constant_35406" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="68251662" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="51" name="__module.model.model.decoder/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="I64" names="72,input.1">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="52" name="__module.model.model.decoder.embed_tokens/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="53" name="__module.model.model.decoder.embed_tokens/aten::embedding/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68251678" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="54" name="__module.model.model.decoder.embed_tokens/aten::embedding/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>51866</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="74,inputs_embeds">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="55" name="self.model.model.decoder.embed_positions.weight" type="Const" version="opset1">
<data element_type="u8" shape="448, 1280" offset="68251682" size="573440" />
<output>
<port id="0" precision="U8">
<dim>448</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="56" name="Convert_1071939" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U8">
<dim>448</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>448</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="57" name="self.model.model.decoder.embed_positions.weight/zero_point" type="Const" version="opset1">
<data element_type="u8" shape="448, 1" offset="68825122" size="448" />
<output>
<port id="0" precision="U8">
<dim>448</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="58" name="Convert_1071942" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U8">
<dim>448</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>448</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="59" name="self.model.model.decoder.embed_positions.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>448</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP16">
<dim>448</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>448</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="60" name="self.model.model.decoder.embed_positions.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="448, 1" offset="68825570" size="896" />
<output>
<port id="0" precision="FP16">
<dim>448</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="61" name="self.model.model.decoder.embed_positions.weight/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>448</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP16">
<dim>448</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>448</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="62" name="self.model.model.decoder.embed_positions.weight/fq_weights_0/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>448</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>448</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="63" name="49" type="Const" version="opset1">
<data element_type="i64" shape="" offset="856336" size="8" />
<output>
<port id="0" precision="I64" names="49" />
</output>
</layer>
<layer id="64" name="Constant_35273" type="Const" version="opset1">
<data element_type="i64" shape="" offset="68826466" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="65" name="Constant_35274" type="Const" version="opset1">
<data element_type="i64" shape="" offset="856336" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="66" name="Gather_35275" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64" />
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="69,75,87,89" />
</output>
</layer>
<layer id="67" name="__module.model.model.decoder/aten::arange/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68826474" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="68" name="__module.model.model.decoder/aten::arange/Range" type="Range" version="opset4">
<data output_type="f32" />
<input>
<port id="0" precision="I64" />
<port id="1" precision="I64" />
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="77,cache_position">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="69" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="FP32" names="78">
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="70" name="Constant_27765" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="68826466" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="71" name="__module.model.model.decoder/prim::ListConstruct/Concat" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="I64" names="79">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="72" name="__module.model.model.decoder/aten::repeat/Tile" type="Tile" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="80,position_ids">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="73" name="__module.model.model.decoder.embed_positions/aten::index/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="74" name="__module.model.model.decoder.embed_positions/aten::index/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68251678" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="75" name="__module.model.model.decoder.embed_positions/aten::index/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>448</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="83,84,positions,positions.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="76" name="__module.model.model.decoder/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="85,input.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="77" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="78" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="79" name="Constant_34960" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="68826482" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="80" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="81" name="Constant_34961" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="68831602" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="82" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="118,hidden_states.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="83" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="68836722" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="84" name="Convert_977363" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="85" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="69655922" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="86" name="Convert_977366" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="87" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="88" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="69662322" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="89" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="90" name="Constant_977371" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="91" name="Reshape_977372" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="92" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="93" name="__module.model.model.decoder.layers.0.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="94" name="Constant_34962" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="69687922" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="95" name="__module.model.model.decoder.layers.0.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="127">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="96" name="Constant_35407" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="97" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="129,query_states.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="98" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="99" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="130">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="100" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="69693074" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="101" name="Convert_973064" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="102" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="70512274" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="103" name="Convert_973067" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="104" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="105" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="70518674" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="106" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="107" name="Constant_973072" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="108" name="Reshape_973073" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="109" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="110" name="__module.model.model.decoder.layers.0.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="133">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="111" name="Constant_35408" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="112" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="135,key_states.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="113" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="114" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.0.decoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="115" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="70544274" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="116" name="Convert_968765" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="117" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="71363474" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="118" name="Convert_968768" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="119" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="120" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="71369874" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="121" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="122" name="Constant_968773" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="123" name="Reshape_968774" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="124" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="125" name="__module.model.model.decoder.layers.0.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="126" name="Constant_34963" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="71395474" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="127" name="__module.model.model.decoder.layers.0.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="138">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="128" name="Constant_35409" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="129" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="140,value_states.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="130" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="131" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.0.decoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="132" name="__module.model.model.decoder/aten::triu/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68251678" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="133" name="__module.model.model.decoder/aten::full/Convert" type="Const" version="opset1">
<data element_type="f32" shape="" offset="71400594" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="134" name="Constant_35298" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="68826466" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="135" name="Reshape_35299" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="I64" />
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="I64" names="145,263,381,499">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="136" name="__module.model.model.decoder/aten::add/Multiply_3" type="Const" version="opset1">
<data element_type="i64" shape="" offset="68826466" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="137" name="__module.model.model.decoder/aten::add/Add_3" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="I64" />
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="I64" names="90,92,target_length" />
</output>
</layer>
<layer id="138" name="Constant_24906" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68251678" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="139" name="Unsqueeze_24907" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="I64" />
<port id="1" precision="I32" />
</input>
<output>
<port id="2" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="140" name="__module.model.model.decoder/prim::ListConstruct_1" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="141" name="__module.model.model.decoder/aten::full/Broadcast" type="Broadcast" version="opset3">
<data mode="numpy" />
<input>
<port id="0" precision="FP32" />
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="95,causal_mask.1">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="142" name="ShapeOf_35305" type="ShapeOf" version="opset3">
<data output_type="i32" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="143" name="Constant_35306" type="Const" version="opset1">
<data element_type="i64" shape="" offset="68826466" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="144" name="Constant_35307" type="Const" version="opset1">
<data element_type="i64" shape="" offset="856336" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="145" name="Gather_35308" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I32">
<dim>2</dim>
</port>
<port id="1" precision="I64" />
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I32" />
</output>
</layer>
<layer id="146" name="__module.model.model.decoder/aten::triu/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68826474" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="147" name="__module.model.model.decoder/aten::triu/Range" type="Range" version="opset4">
<data output_type="i32" />
<input>
<port id="0" precision="I32" />
<port id="1" precision="I32" />
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="I32">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="148" name="__module.model.model.decoder/aten::triu/Unsqueeze" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="I32">
<dim>-1</dim>
</port>
<port id="1" precision="I32" />
</input>
<output>
<port id="2" precision="I32">
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="149" name="__module.model.model.decoder/aten::triu/Convert" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68826474" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="150" name="Convert_35311" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64" />
</input>
<output>
<port id="1" precision="I32" />
</output>
</layer>
<layer id="151" name="__module.model.model.decoder/aten::triu/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="I32" />
<port id="1" precision="I32" />
</input>
<output>
<port id="2" precision="I32" />
</output>
</layer>
<layer id="152" name="__module.model.model.decoder/aten::triu/Range_1" type="Range" version="opset4">
<data output_type="i32" />
<input>
<port id="0" precision="I32" />
<port id="1" precision="I32" />
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="I32">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="153" name="__module.model.model.decoder/aten::triu/Unsqueeze_1" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="I32">
<dim>-1</dim>
</port>
<port id="1" precision="I32" />
</input>
<output>
<port id="2" precision="I32">
<dim>-1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="154" name="__module.model.model.decoder/aten::triu/GreaterEqual" type="GreaterEqual" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="I32">
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="BOOL">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="155" name="__module.model.model.decoder/aten::triu/ConvertLike" type="Const" version="opset1">
<data element_type="f32" shape="" offset="68251678" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="156" name="__module.model.model.decoder/aten::triu/Select" type="Select" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="BOOL">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="FP32" />
</input>
<output>
<port id="3" precision="FP32" names="96_1">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="157" name="__module.model.model.decoder/aten::arange/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68251678" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="158" name="__module.model.model.decoder/aten::arange/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="" offset="68826474" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="159" name="__module.model.model.decoder/aten::arange/Range_1" type="Range" version="opset4">
<data output_type="f32" />
<input>
<port id="0" precision="I32" />
<port id="1" precision="I64" />
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="160" name="__module.model.model.decoder/aten::arange/ConvertLike" type="Convert" version="opset1">
<data destination_type="i64" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I64" names="97">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="161" name="__module.model.model.decoder/aten::gt/Convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="162" name="Constant_25009" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="71400598" size="16" />
<output>
<port id="0" precision="I64" names="98">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="163" name="__module.model.model.decoder/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="99">
<dim>-1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="164" name="__module.model.model.decoder/aten::gt/Greater" type="Greater" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="BOOL" names="100">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="165" name="__module.model.model.decoder/aten::mul_/ConvertLike" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="BOOL">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="166" name="__module.model.model.decoder/aten::mul_/Multiply" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="96,causal_mask.3">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="167" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="FP32" names="102">
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="168" name="48" type="Const" version="opset1">
<data element_type="i64" shape="" offset="68826466" size="8" />
<output>
<port id="0" precision="I64" names="48" />
</output>
</layer>
<layer id="169" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="FP32" names="103,104,105">
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="170" name="Constant_32723" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="68826466" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="171" name="Constant_32725" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="68826466" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="172" name="Constant_32727" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="68826466" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="173" name="__module.model.model.decoder/prim::ListConstruct_2" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64">
<dim>1</dim>
</port>
<port id="3" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="4" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="174" name="__module.model.model.decoder/aten::expand/Broadcast" type="Broadcast" version="opset3">
<data mode="bidirectional" />
<input>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="107,146,147,148,264,265,266,382,383,384,500,501,502,attention_mask">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="175" name="Constant_25279" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="856336" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="176" name="Constant_25282" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="68826466" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="177" name="Constant_25277" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="71400614" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="178" name="__module.model.model.decoder.layers.0.self_attn/aten::slice/Slice_3" type="Slice" version="opset8">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64">
<dim>1</dim>
</port>
<port id="3" precision="I64">
<dim>1</dim>
</port>
<port id="4" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="5" precision="FP32" names="149,267,385,503,causal_mask,causal_mask.11,causal_mask.7,causal_mask.9">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="179" name="__module.model.model.decoder.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="150,attn_output.1">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="180" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="181" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="151,attn_output.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="182" name="Constant_35410" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="183" name="__module.model.model.decoder.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="153,input.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="184" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="71400646" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="185" name="Convert_981662" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="186" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="72219846" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="187" name="Convert_981665" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="188" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="189" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="72226246" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="190" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="191" name="Constant_981670" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="192" name="Reshape_981671" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="193" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="194" name="__module.model.model.decoder.layers.0.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="195" name="Constant_34964" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="72251846" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="196" name="__module.model.model.decoder.layers.0.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="156,158,input.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="197" name="__module.model.model.decoder.layers.0/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="162,input.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="198" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="199" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="200" name="Constant_34965" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="72256966" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="201" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="202" name="Constant_34966" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="72262086" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="203" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="166,hidden_states.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="204" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="72267206" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="205" name="Convert_985961" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="206" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="73086406" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="207" name="Convert_985964" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="208" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="209" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="73092806" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="210" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="211" name="Constant_985969" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="212" name="Reshape_985970" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="213" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="214" name="__module.model.model.decoder.layers.0.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="215" name="Constant_34967" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="73118406" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="216" name="__module.model.model.decoder.layers.0.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="175">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="217" name="Constant_35411" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="218" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="177,query_states.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="219" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="220" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="178">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="221" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="73123526" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="222" name="Convert_964466" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="223" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="73942726" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="224" name="Convert_964469" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="225" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="226" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="73949126" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="227" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="228" name="Constant_964474" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="229" name="Reshape_964475" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="230" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="231" name="__module.model.model.decoder.layers.0.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="181">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="232" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="183,key_states.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="233" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="234" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.0.encoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="235" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="73974726" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="236" name="Convert_960167" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="237" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="74793926" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="238" name="Convert_960170" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="239" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="240" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="74800326" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="241" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="242" name="Constant_960175" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="243" name="Reshape_960176" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="244" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="245" name="__module.model.model.decoder.layers.0.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="246" name="Constant_34968" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="74825926" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="247" name="__module.model.model.decoder.layers.0.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="186">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="248" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="188,value_states.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="249" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="250" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.0.encoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="251" name="__module.model.model.decoder.layers.0.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="193,attn_output.5">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="252" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="253" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="194,attn_output.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="254" name="Constant_35412" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="255" name="__module.model.model.decoder.layers.0.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="196,input.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="256" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="74831046" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="257" name="Convert_990260" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="258" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="75650246" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="259" name="Convert_990263" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="260" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="261" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="75656646" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="262" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="263" name="Constant_990268" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="264" name="Reshape_990269" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="265" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="266" name="__module.model.model.decoder.layers.0.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="267" name="Constant_34969" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="75682246" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="268" name="__module.model.model.decoder.layers.0.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="199,201,input.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="269" name="__module.model.model.decoder.layers.0/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="205,input.19">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="270" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="271" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="272" name="Constant_34970" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="75687366" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="273" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="274" name="Constant_34971" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="75692486" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="275" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="209,input.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="276" name="self.model.model.decoder.layers.0.fc1.weight" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 128" offset="75697606" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="277" name="Convert_899981" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="278" name="self.model.model.decoder.layers.0.fc1.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 1" offset="78974406" size="25600" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="279" name="Convert_899984" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="280" name="self.model.model.decoder.layers.0.fc1.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="281" name="self.model.model.decoder.layers.0.fc1.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="5120, 10, 1" offset="79000006" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="282" name="self.model.model.decoder.layers.0.fc1.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="283" name="Constant_899989" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="79102406" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="284" name="Reshape_899990" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="285" name="self.model.model.decoder.layers.0.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="286" name="__module.model.model.decoder.layers.0.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="287" name="Constant_34972" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 5120" offset="79102422" size="20480" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="288" name="__module.model.model.decoder.layers.0.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="212,input.23">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="289" name="__module.model.model.decoder.layers.0.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="213,input.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="290" name="self.model.model.decoder.layers.0.fc2.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 128" offset="79122902" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="291" name="Convert_904280" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="292" name="self.model.model.decoder.layers.0.fc2.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 1" offset="82399702" size="25600" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="293" name="Convert_904283" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="294" name="self.model.model.decoder.layers.0.fc2.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="295" name="self.model.model.decoder.layers.0.fc2.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 40, 1" offset="82425302" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="296" name="self.model.model.decoder.layers.0.fc2.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="297" name="Constant_904288" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="82527702" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="298" name="Reshape_904289" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="299" name="self.model.model.decoder.layers.0.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="300" name="__module.model.model.decoder.layers.0.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="301" name="Constant_34973" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="82527718" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="302" name="__module.model.model.decoder.layers.0.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="217,input.29">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="303" name="__module.model.model.decoder.layers.0/aten::add/Add_2" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="219,221,input.31">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="304" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="305" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="306" name="Constant_34974" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="82532838" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="307" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="308" name="Constant_34975" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="82537958" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="309" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="236,hidden_states.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="310" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="82543078" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="311" name="Convert_1003157" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="312" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="83362278" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="313" name="Convert_1003160" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="314" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="315" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="83368678" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="316" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="317" name="Constant_1003165" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="318" name="Reshape_1003166" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="319" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="320" name="__module.model.model.decoder.layers.1.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="321" name="Constant_34976" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="83394278" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="322" name="__module.model.model.decoder.layers.1.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="245">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="323" name="Constant_35413" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="324" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="247,query_states.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="325" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="326" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="248">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="327" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="83399398" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="328" name="Convert_998858" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="329" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="84218598" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="330" name="Convert_998861" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="331" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="332" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="84224998" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="333" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="334" name="Constant_998866" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="335" name="Reshape_998867" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="336" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="337" name="__module.model.model.decoder.layers.1.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="251">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="338" name="Constant_35414" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="339" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="253,key_states.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="340" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="341" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.1.decoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="342" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="84250598" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="343" name="Convert_994559" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="344" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="85069798" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="345" name="Convert_994562" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="346" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="347" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="85076198" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="348" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="349" name="Constant_994567" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="350" name="Reshape_994568" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="351" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="352" name="__module.model.model.decoder.layers.1.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="353" name="Constant_34977" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="85101798" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="354" name="__module.model.model.decoder.layers.1.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="256">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="355" name="Constant_35415" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="356" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="258,value_states.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="357" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="358" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.1.decoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="359" name="__module.model.model.decoder.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="268,attn_output.9">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="360" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="361" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="269,attn_output.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="362" name="Constant_35416" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="363" name="__module.model.model.decoder.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="271,input.33">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="364" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="85106918" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="365" name="Convert_1007456" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="366" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="85926118" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="367" name="Convert_1007459" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="368" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="369" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="85932518" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="370" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="371" name="Constant_1007464" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="372" name="Reshape_1007465" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="373" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="374" name="__module.model.model.decoder.layers.1.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="375" name="Constant_34978" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="85958118" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="376" name="__module.model.model.decoder.layers.1.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="274,276,input.35">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="377" name="__module.model.model.decoder.layers.1/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="280,input.37">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="378" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="379" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="380" name="Constant_34979" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="85963238" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="381" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="382" name="Constant_34980" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="85968358" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="383" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="284,hidden_states.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="384" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="85973478" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="385" name="Convert_1011755" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="386" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="86792678" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="387" name="Convert_1011758" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="388" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="389" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="86799078" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="390" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="391" name="Constant_1011763" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="392" name="Reshape_1011764" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="393" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="394" name="__module.model.model.decoder.layers.1.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="395" name="Constant_34981" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="86824678" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="396" name="__module.model.model.decoder.layers.1.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="293">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="397" name="Constant_35417" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="398" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="295,query_states.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="399" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="400" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="296">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="401" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="86829798" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="402" name="Convert_955868" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="403" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="87648998" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="404" name="Convert_955871" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="405" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="406" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="87655398" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="407" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="408" name="Constant_955876" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="409" name="Reshape_955877" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="410" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="411" name="__module.model.model.decoder.layers.1.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="299">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="412" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="301,key_states.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="413" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="414" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.1.encoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="415" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="87680998" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="416" name="Convert_951569" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="417" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="88500198" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="418" name="Convert_951572" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="419" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="420" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="88506598" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="421" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="422" name="Constant_951577" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="423" name="Reshape_951578" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="424" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="425" name="__module.model.model.decoder.layers.1.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="426" name="Constant_34982" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="88532198" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="427" name="__module.model.model.decoder.layers.1.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="304">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="428" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="306,value_states.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="429" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="430" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.1.encoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="431" name="__module.model.model.decoder.layers.1.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="311,attn_output.13">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="432" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="433" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="312,attn_output.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="434" name="Constant_35418" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="435" name="__module.model.model.decoder.layers.1.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="314,input.39">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="436" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="88537318" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="437" name="Convert_1016054" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="438" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="89356518" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="439" name="Convert_1016057" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="440" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="441" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="89362918" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="442" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="443" name="Constant_1016062" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="444" name="Reshape_1016063" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="445" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="446" name="__module.model.model.decoder.layers.1.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="447" name="Constant_34983" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="89388518" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="448" name="__module.model.model.decoder.layers.1.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="317,319,input.41">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="449" name="__module.model.model.decoder.layers.1/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="323,input.43">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="450" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="451" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="452" name="Constant_34984" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="89393638" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="453" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="454" name="Constant_34985" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="89398758" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="455" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="327,input.45">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="456" name="self.model.model.decoder.layers.1.fc1.weight" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 128" offset="89403878" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="457" name="Convert_908579" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="458" name="self.model.model.decoder.layers.1.fc1.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 1" offset="92680678" size="25600" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="459" name="Convert_908582" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="460" name="self.model.model.decoder.layers.1.fc1.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="461" name="self.model.model.decoder.layers.1.fc1.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="5120, 10, 1" offset="92706278" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="462" name="self.model.model.decoder.layers.1.fc1.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="463" name="Constant_908587" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="79102406" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="464" name="Reshape_908588" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="465" name="self.model.model.decoder.layers.1.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="466" name="__module.model.model.decoder.layers.1.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="467" name="Constant_34986" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 5120" offset="92808678" size="20480" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="468" name="__module.model.model.decoder.layers.1.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="330,input.47">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="469" name="__module.model.model.decoder.layers.1.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="331,input.49">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="470" name="self.model.model.decoder.layers.1.fc2.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 128" offset="92829158" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="471" name="Convert_912878" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="472" name="self.model.model.decoder.layers.1.fc2.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 1" offset="96105958" size="25600" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="473" name="Convert_912881" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="474" name="self.model.model.decoder.layers.1.fc2.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="475" name="self.model.model.decoder.layers.1.fc2.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 40, 1" offset="96131558" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="476" name="self.model.model.decoder.layers.1.fc2.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="477" name="Constant_912886" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="82527702" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="478" name="Reshape_912887" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="479" name="self.model.model.decoder.layers.1.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="480" name="__module.model.model.decoder.layers.1.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="481" name="Constant_34987" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="96233958" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="482" name="__module.model.model.decoder.layers.1.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="335,input.53">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="483" name="__module.model.model.decoder.layers.1/aten::add/Add_2" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="337,339,input.55">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="484" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="485" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="486" name="Constant_34988" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="96239078" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="487" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="488" name="Constant_34989" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="96244198" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="489" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="354,hidden_states.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="490" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="96249318" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="491" name="Convert_1028951" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="492" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="97068518" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="493" name="Convert_1028954" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="494" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="495" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="97074918" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="496" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="497" name="Constant_1028959" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="498" name="Reshape_1028960" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="499" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="500" name="__module.model.model.decoder.layers.2.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="501" name="Constant_34990" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="97100518" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="502" name="__module.model.model.decoder.layers.2.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="363">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="503" name="Constant_35419" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="504" name="__module.model.model.decoder.layers.2.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="365,query_states.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="505" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="506" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="366">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="507" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="97105638" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="508" name="Convert_1024652" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="509" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="97924838" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="510" name="Convert_1024655" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="511" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="512" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="97931238" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="513" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="514" name="Constant_1024660" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="515" name="Reshape_1024661" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="516" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="517" name="__module.model.model.decoder.layers.2.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="369">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="518" name="Constant_35420" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="519" name="__module.model.model.decoder.layers.2.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="371,key_states.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="520" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="521" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.2.decoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="522" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="97956838" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="523" name="Convert_1020353" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="524" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="98776038" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="525" name="Convert_1020356" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="526" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="527" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="98782438" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="528" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="529" name="Constant_1020361" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="530" name="Reshape_1020362" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="531" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="532" name="__module.model.model.decoder.layers.2.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="533" name="Constant_34991" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="98808038" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="534" name="__module.model.model.decoder.layers.2.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="374">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="535" name="Constant_35421" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="536" name="__module.model.model.decoder.layers.2.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="376,value_states.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="537" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="538" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.2.decoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="539" name="__module.model.model.decoder.layers.2.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="386,attn_output.17">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="540" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="541" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="387,attn_output.19">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="542" name="Constant_35422" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="543" name="__module.model.model.decoder.layers.2.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="389,input.57">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="544" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="98813158" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="545" name="Convert_1033250" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="546" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="99632358" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="547" name="Convert_1033253" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="548" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="549" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="99638758" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="550" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="551" name="Constant_1033258" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="552" name="Reshape_1033259" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="553" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="554" name="__module.model.model.decoder.layers.2.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="555" name="Constant_34992" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="99664358" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="556" name="__module.model.model.decoder.layers.2.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="392,394,input.59">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="557" name="__module.model.model.decoder.layers.2/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="398,input.61">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="558" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="559" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="560" name="Constant_34993" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="99669478" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="561" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="562" name="Constant_34994" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="99674598" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="563" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="402,hidden_states.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="564" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="99679718" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="565" name="Convert_1037549" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="566" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="100498918" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="567" name="Convert_1037552" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="568" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="569" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="100505318" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="570" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="571" name="Constant_1037557" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="572" name="Reshape_1037558" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="573" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="574" name="__module.model.model.decoder.layers.2.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="575" name="Constant_34995" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="100530918" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="576" name="__module.model.model.decoder.layers.2.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="411">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="577" name="Constant_35423" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="578" name="__module.model.model.decoder.layers.2.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="413,query_states.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="579" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="580" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="414">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="581" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="100536038" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="582" name="Convert_947270" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="583" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="101355238" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="584" name="Convert_947273" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="585" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="586" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="101361638" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="587" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="588" name="Constant_947278" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="589" name="Reshape_947279" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="590" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="591" name="__module.model.model.decoder.layers.2.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="417">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="592" name="__module.model.model.decoder.layers.2.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="419,key_states.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="593" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="594" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.2.encoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="595" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="101387238" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="596" name="Convert_942971" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="597" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="102206438" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="598" name="Convert_942974" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="599" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="600" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="102212838" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="601" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="602" name="Constant_942979" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="603" name="Reshape_942980" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="604" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="605" name="__module.model.model.decoder.layers.2.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="606" name="Constant_34996" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="102238438" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="607" name="__module.model.model.decoder.layers.2.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="422">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="608" name="__module.model.model.decoder.layers.2.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="424,value_states.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="609" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="610" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.2.encoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="611" name="__module.model.model.decoder.layers.2.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="429,attn_output.21">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="612" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="613" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="430,attn_output.23">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="614" name="Constant_35424" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="615" name="__module.model.model.decoder.layers.2.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="432,input.63">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="616" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="102243558" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="617" name="Convert_1041848" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="618" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="103062758" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="619" name="Convert_1041851" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="620" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="621" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="103069158" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="622" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="623" name="Constant_1041856" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="624" name="Reshape_1041857" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="625" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="626" name="__module.model.model.decoder.layers.2.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="627" name="Constant_34997" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="103094758" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="628" name="__module.model.model.decoder.layers.2.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="435,437,input.65">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="629" name="__module.model.model.decoder.layers.2/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="441,input.67">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="630" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="631" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="632" name="Constant_34998" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="103099878" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="633" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="634" name="Constant_34999" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="103104998" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="635" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="445,input.69">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="636" name="self.model.model.decoder.layers.2.fc1.weight" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 128" offset="103110118" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="637" name="Convert_917177" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="638" name="self.model.model.decoder.layers.2.fc1.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 1" offset="106386918" size="25600" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="639" name="Convert_917180" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="640" name="self.model.model.decoder.layers.2.fc1.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="641" name="self.model.model.decoder.layers.2.fc1.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="5120, 10, 1" offset="106412518" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="642" name="self.model.model.decoder.layers.2.fc1.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="643" name="Constant_917185" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="79102406" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="644" name="Reshape_917186" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="645" name="self.model.model.decoder.layers.2.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="646" name="__module.model.model.decoder.layers.2.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="647" name="Constant_35000" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 5120" offset="106514918" size="20480" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="648" name="__module.model.model.decoder.layers.2.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="448,input.71">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="649" name="__module.model.model.decoder.layers.2.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="449,input.73">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="650" name="self.model.model.decoder.layers.2.fc2.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 128" offset="106535398" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="651" name="Convert_921476" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="652" name="self.model.model.decoder.layers.2.fc2.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 1" offset="109812198" size="25600" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="653" name="Convert_921479" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="654" name="self.model.model.decoder.layers.2.fc2.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="655" name="self.model.model.decoder.layers.2.fc2.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 40, 1" offset="109837798" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="656" name="self.model.model.decoder.layers.2.fc2.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="657" name="Constant_921484" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="82527702" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="658" name="Reshape_921485" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="659" name="self.model.model.decoder.layers.2.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="660" name="__module.model.model.decoder.layers.2.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="661" name="Constant_35001" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="109940198" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="662" name="__module.model.model.decoder.layers.2.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="453,input.77">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="663" name="__module.model.model.decoder.layers.2/aten::add/Add_2" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="455,457,input.79">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="664" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="665" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="666" name="Constant_35002" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="109945318" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="667" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="668" name="Constant_35003" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="109950438" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="669" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="472,hidden_states.31">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="670" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="109955558" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="671" name="Convert_1046147" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="672" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="110774758" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="673" name="Convert_1046150" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="674" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="675" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="110781158" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="676" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="677" name="Constant_1046155" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="678" name="Reshape_1046156" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="679" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="680" name="__module.model.model.decoder.layers.3.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="681" name="Constant_35005" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="110806758" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="682" name="__module.model.model.decoder.layers.3.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="492">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="683" name="Constant_35425" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="684" name="__module.model.model.decoder.layers.3.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="494,value_states.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="685" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="686" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.3.decoder.value">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="688" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="110811878" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="689" name="Convert_1050446" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="690" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="111631078" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="691" name="Convert_1050449" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="692" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="693" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="111637478" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="694" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="695" name="Constant_1050454" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="696" name="Reshape_1050455" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="697" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="698" name="__module.model.model.decoder.layers.3.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="487">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="699" name="Constant_35426" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="700" name="__module.model.model.decoder.layers.3.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="489,key_states.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="701" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="702" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="present.3.decoder.key">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="716" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="111663078" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="717" name="Convert_1054745" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="718" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="112482278" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="719" name="Convert_1054748" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="720" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="721" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="112488678" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="722" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="723" name="Constant_1054753" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="724" name="Reshape_1054754" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="725" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="726" name="__module.model.model.decoder.layers.3.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="727" name="Constant_35004" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="112514278" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="728" name="__module.model.model.decoder.layers.3.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="481">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="729" name="Constant_35427" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="730" name="__module.model.model.decoder.layers.3.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="483,query_states.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="731" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="732" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="484">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="733" name="__module.model.model.decoder.layers.3.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="504,attn_output.25">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="734" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="735" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="505,attn_output.27">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="736" name="Constant_35428" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="737" name="__module.model.model.decoder.layers.3.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="507,input.81">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="738" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="112519398" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="739" name="Convert_1059044" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="740" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="113338598" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="741" name="Convert_1059047" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="742" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="743" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="113344998" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="744" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="745" name="Constant_1059052" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="746" name="Reshape_1059053" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="747" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="748" name="__module.model.model.decoder.layers.3.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="749" name="Constant_35006" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="113370598" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="750" name="__module.model.model.decoder.layers.3.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="510,512,input.83">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="751" name="__module.model.model.decoder.layers.3/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="516,input.85">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="752" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="753" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="754" name="Constant_35007" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="113375718" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="755" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="756" name="Constant_35008" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="113380838" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="757" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="520,hidden_states.35">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="758" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="113385958" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="759" name="Convert_1063343" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="760" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="114205158" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="761" name="Convert_1063346" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="762" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="763" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="114211558" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="764" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="765" name="Constant_1063351" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="766" name="Reshape_1063352" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="767" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="768" name="__module.model.model.decoder.layers.3.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="769" name="Constant_35009" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="114237158" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="770" name="__module.model.model.decoder.layers.3.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="529">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="771" name="Constant_35429" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="69693042" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="772" name="__module.model.model.decoder.layers.3.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="531,query_states.29">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="773" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="774" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="532">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="775" name="__module.model.model.decoder.layers.3.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="547,attn_output.29">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="776" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="856368" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="777" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="548,attn_output">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="778" name="Constant_35430" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="71400622" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="779" name="__module.model.model.decoder.layers.3.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>20</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="550,input.87">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="780" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 128" offset="114242278" size="819200" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="781" name="Convert_1067642" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="782" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 10, 1" offset="115061478" size="6400" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="783" name="Convert_1067645" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="784" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="785" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 10, 1" offset="115067878" size="25600" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="786" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="787" name="Constant_1067650" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="851200" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="788" name="Reshape_1067651" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="789" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="790" name="__module.model.model.decoder.layers.3.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="791" name="Constant_35010" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="115093478" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="792" name="__module.model.model.decoder.layers.3.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="553,555,input.89">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="793" name="__module.model.model.decoder.layers.3/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="559,input.91">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="794" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="795" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="796" name="Constant_35011" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="115098598" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="797" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="798" name="Constant_35012" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="115103718" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="799" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="563,input.93">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="800" name="self.model.model.decoder.layers.3.fc1.weight" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 128" offset="115108838" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="801" name="Convert_925775" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="802" name="self.model.model.decoder.layers.3.fc1.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="5120, 10, 1" offset="118385638" size="25600" />
<output>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="803" name="Convert_925778" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="804" name="self.model.model.decoder.layers.3.fc1.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="805" name="self.model.model.decoder.layers.3.fc1.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="5120, 10, 1" offset="118411238" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="806" name="self.model.model.decoder.layers.3.fc1.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="807" name="Constant_925783" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="79102406" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="808" name="Reshape_925784" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>10</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="809" name="self.model.model.decoder.layers.3.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="810" name="__module.model.model.decoder.layers.3.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>5120</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="811" name="Constant_35013" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 5120" offset="118513638" size="20480" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="812" name="__module.model.model.decoder.layers.3.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="566,input.95">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="813" name="__module.model.model.decoder.layers.3.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="567,input.97">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="814" name="self.model.model.decoder.layers.3.fc2.weight" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 128" offset="118534118" size="3276800" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="815" name="Convert_930074" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="816" name="self.model.model.decoder.layers.3.fc2.weight/zero_point" type="Const" version="opset1">
<data element_type="u4" shape="1280, 40, 1" offset="121810918" size="25600" />
<output>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="817" name="Convert_930077" type="Convert" version="opset1">
<data destination_type="f16" />
<input>
<port id="0" precision="U4">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="818" name="self.model.model.decoder.layers.3.fc2.weight/zero_point/subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="819" name="self.model.model.decoder.layers.3.fc2.weight/scale" type="Const" version="opset1">
<data element_type="f16" shape="1280, 40, 1" offset="121836518" size="102400" />
<output>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="820" name="self.model.model.decoder.layers.3.fc2.weight/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="821" name="Constant_930082" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="82527702" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="822" name="Reshape_930083" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>40</dim>
<dim>128</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="823" name="self.model.model.decoder.layers.3.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="FP16">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</output>
</layer>
<layer id="824" name="__module.model.model.decoder.layers.3.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>5120</dim>
</port>
<port id="1" precision="FP32">
<dim>1280</dim>
<dim>5120</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="825" name="Constant_35014" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="121938918" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="826" name="__module.model.model.decoder.layers.3.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="571,input.101">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="827" name="__module.model.model.decoder.layers.3/aten::add/Add_2" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="573,575,input.103">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="828" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="68826478" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="829" name="__module.model.model.decoder.layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="830" name="Constant_35015" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="121944038" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="831" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="832" name="Constant_35016" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1280" offset="121949158" size="5120" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="833" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="583,585,603,input">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
</output>
</layer>
<layer id="834" name="__module.model.proj_out/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1280</dim>
</port>
<port id="1" precision="FP32">
<dim>51866</dim>
<dim>1280</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="logits">
<dim>-1</dim>
<dim>-1</dim>
<dim>51866</dim>
</port>
</output>
</layer>
<layer id="835" name="Result_27358" type="Result" version="opset1" output_names="logits">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>51866</dim>
</port>
</input>
</layer>
<layer id="715" name="Result_27366" type="Result" version="opset1" output_names="present.0.decoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="714" name="Result_27365" type="Result" version="opset1" output_names="present.0.decoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="713" name="Result_27364" type="Result" version="opset1" output_names="present.0.encoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="712" name="Result_27363" type="Result" version="opset1" output_names="present.0.encoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="711" name="Result_27370" type="Result" version="opset1" output_names="present.1.decoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="710" name="Result_27369" type="Result" version="opset1" output_names="present.1.decoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="709" name="Result_27368" type="Result" version="opset1" output_names="present.1.encoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="708" name="Result_27367" type="Result" version="opset1" output_names="present.1.encoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="707" name="Result_27374" type="Result" version="opset1" output_names="present.2.decoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="706" name="Result_27373" type="Result" version="opset1" output_names="present.2.decoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="705" name="Result_27372" type="Result" version="opset1" output_names="present.2.encoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="704" name="Result_27371" type="Result" version="opset1" output_names="present.2.encoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="703" name="Result_27378" type="Result" version="opset1" output_names="present.3.decoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="687" name="Result_27377" type="Result" version="opset1" output_names="present.3.decoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="41" name="Result_27376" type="Result" version="opset1" output_names="present.3.encoder.key">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
<layer id="26" name="Result_27375" type="Result" version="opset1" output_names="present.3.encoder.value">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>20</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</input>
</layer>
</layers>
<edges>
<edge from-layer="0" from-port="0" to-layer="245" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="231" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="411" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="425" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="605" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="591" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="12" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="37" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="51" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="15" to-port="0" />
<edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
<edge from-layer="3" from-port="1" to-layer="6" to-port="0" />
<edge from-layer="4" from-port="0" to-layer="5" to-port="0" />
<edge from-layer="5" from-port="1" to-layer="6" to-port="1" />
<edge from-layer="6" from-port="2" to-layer="8" to-port="0" />
<edge from-layer="7" from-port="0" to-layer="8" to-port="1" />
<edge from-layer="8" from-port="2" to-layer="10" to-port="0" />
<edge from-layer="9" from-port="0" to-layer="10" to-port="1" />
<edge from-layer="10" from-port="2" to-layer="11" to-port="0" />
<edge from-layer="11" from-port="1" to-layer="12" to-port="1" />
<edge from-layer="12" from-port="2" to-layer="14" to-port="0" />
<edge from-layer="13" from-port="0" to-layer="14" to-port="1" />
<edge from-layer="14" from-port="2" to-layer="23" to-port="0" />
<edge from-layer="15" from-port="1" to-layer="18" to-port="0" />
<edge from-layer="15" from-port="1" to-layer="66" to-port="0" />
<edge from-layer="16" from-port="0" to-layer="18" to-port="1" />
<edge from-layer="17" from-port="0" to-layer="18" to-port="2" />
<edge from-layer="18" from-port="3" to-layer="22" to-port="0" />
<edge from-layer="18" from-port="3" to-layer="173" to-port="0" />
<edge from-layer="18" from-port="3" to-layer="71" to-port="0" />
<edge from-layer="19" from-port="0" to-layer="22" to-port="1" />
<edge from-layer="20" from-port="0" to-layer="22" to-port="2" />
<edge from-layer="21" from-port="0" to-layer="22" to-port="3" />
<edge from-layer="22" from-port="4" to-layer="428" to-port="1" />
<edge from-layer="22" from-port="4" to-layer="608" to-port="1" />
<edge from-layer="22" from-port="4" to-layer="592" to-port="1" />
<edge from-layer="22" from-port="4" to-layer="38" to-port="1" />
<edge from-layer="22" from-port="4" to-layer="248" to-port="1" />
<edge from-layer="22" from-port="4" to-layer="232" to-port="1" />
<edge from-layer="22" from-port="4" to-layer="23" to-port="1" />
<edge from-layer="22" from-port="4" to-layer="412" to-port="1" />
<edge from-layer="23" from-port="2" to-layer="25" to-port="0" />
<edge from-layer="24" from-port="0" to-layer="25" to-port="1" />
<edge from-layer="25" from-port="2" to-layer="26" to-port="0" />
<edge from-layer="25" from-port="2" to-layer="775" to-port="2" />
<edge from-layer="27" from-port="0" to-layer="28" to-port="0" />
<edge from-layer="28" from-port="1" to-layer="31" to-port="0" />
<edge from-layer="29" from-port="0" to-layer="30" to-port="0" />
<edge from-layer="30" from-port="1" to-layer="31" to-port="1" />
<edge from-layer="31" from-port="2" to-layer="33" to-port="0" />
<edge from-layer="32" from-port="0" to-layer="33" to-port="1" />
<edge from-layer="33" from-port="2" to-layer="35" to-port="0" />
<edge from-layer="34" from-port="0" to-layer="35" to-port="1" />
<edge from-layer="35" from-port="2" to-layer="36" to-port="0" />
<edge from-layer="36" from-port="1" to-layer="37" to-port="1" />
<edge from-layer="37" from-port="2" to-layer="38" to-port="0" />
<edge from-layer="38" from-port="2" to-layer="40" to-port="0" />
<edge from-layer="39" from-port="0" to-layer="40" to-port="1" />
<edge from-layer="40" from-port="2" to-layer="775" to-port="1" />
<edge from-layer="40" from-port="2" to-layer="41" to-port="0" />
<edge from-layer="42" from-port="0" to-layer="43" to-port="0" />
<edge from-layer="43" from-port="1" to-layer="46" to-port="0" />
<edge from-layer="44" from-port="0" to-layer="45" to-port="0" />
<edge from-layer="45" from-port="1" to-layer="46" to-port="1" />
<edge from-layer="46" from-port="2" to-layer="48" to-port="0" />
<edge from-layer="47" from-port="0" to-layer="48" to-port="1" />
<edge from-layer="48" from-port="2" to-layer="49" to-port="0" />
<edge from-layer="49" from-port="1" to-layer="54" to-port="0" />
<edge from-layer="49" from-port="1" to-layer="834" to-port="1" />
<edge from-layer="50" from-port="0" to-layer="51" to-port="1" />
<edge from-layer="51" from-port="2" to-layer="52" to-port="0" />
<edge from-layer="52" from-port="1" to-layer="54" to-port="1" />
<edge from-layer="53" from-port="0" to-layer="54" to-port="2" />
<edge from-layer="54" from-port="3" to-layer="76" to-port="0" />
<edge from-layer="55" from-port="0" to-layer="56" to-port="0" />
<edge from-layer="56" from-port="1" to-layer="59" to-port="0" />
<edge from-layer="57" from-port="0" to-layer="58" to-port="0" />
<edge from-layer="58" from-port="1" to-layer="59" to-port="1" />
<edge from-layer="59" from-port="2" to-layer="61" to-port="0" />
<edge from-layer="60" from-port="0" to-layer="61" to-port="1" />
<edge from-layer="61" from-port="2" to-layer="62" to-port="0" />
<edge from-layer="62" from-port="1" to-layer="75" to-port="0" />
<edge from-layer="63" from-port="0" to-layer="69" to-port="1" />
<edge from-layer="63" from-port="0" to-layer="167" to-port="1" />
<edge from-layer="63" from-port="0" to-layer="68" to-port="0" />
<edge from-layer="64" from-port="0" to-layer="66" to-port="1" />
<edge from-layer="65" from-port="0" to-layer="66" to-port="2" />
<edge from-layer="66" from-port="3" to-layer="150" to-port="0" />
<edge from-layer="66" from-port="3" to-layer="68" to-port="1" />
<edge from-layer="66" from-port="3" to-layer="137" to-port="0" />
<edge from-layer="66" from-port="3" to-layer="135" to-port="0" />
<edge from-layer="67" from-port="0" to-layer="68" to-port="2" />
<edge from-layer="68" from-port="3" to-layer="163" to-port="0" />
<edge from-layer="68" from-port="3" to-layer="69" to-port="0" />
<edge from-layer="69" from-port="2" to-layer="72" to-port="0" />
<edge from-layer="70" from-port="0" to-layer="71" to-port="1" />
<edge from-layer="71" from-port="2" to-layer="72" to-port="1" />
<edge from-layer="72" from-port="2" to-layer="73" to-port="0" />
<edge from-layer="73" from-port="1" to-layer="75" to-port="1" />
<edge from-layer="74" from-port="0" to-layer="75" to-port="2" />
<edge from-layer="75" from-port="3" to-layer="76" to-port="1" />
<edge from-layer="76" from-port="2" to-layer="197" to-port="0" />
<edge from-layer="76" from-port="2" to-layer="78" to-port="0" />
<edge from-layer="77" from-port="0" to-layer="78" to-port="1" />
<edge from-layer="78" from-port="2" to-layer="80" to-port="0" />
<edge from-layer="79" from-port="0" to-layer="80" to-port="1" />
<edge from-layer="80" from-port="2" to-layer="82" to-port="0" />
<edge from-layer="81" from-port="0" to-layer="82" to-port="1" />
<edge from-layer="82" from-port="2" to-layer="125" to-port="0" />
<edge from-layer="82" from-port="2" to-layer="93" to-port="0" />
<edge from-layer="82" from-port="2" to-layer="110" to-port="0" />
<edge from-layer="83" from-port="0" to-layer="84" to-port="0" />
<edge from-layer="84" from-port="1" to-layer="87" to-port="0" />
<edge from-layer="85" from-port="0" to-layer="86" to-port="0" />
<edge from-layer="86" from-port="1" to-layer="87" to-port="1" />
<edge from-layer="87" from-port="2" to-layer="89" to-port="0" />
<edge from-layer="88" from-port="0" to-layer="89" to-port="1" />
<edge from-layer="89" from-port="2" to-layer="91" to-port="0" />
<edge from-layer="90" from-port="0" to-layer="91" to-port="1" />
<edge from-layer="91" from-port="2" to-layer="92" to-port="0" />
<edge from-layer="92" from-port="1" to-layer="93" to-port="1" />
<edge from-layer="93" from-port="2" to-layer="95" to-port="0" />
<edge from-layer="94" from-port="0" to-layer="95" to-port="1" />
<edge from-layer="95" from-port="2" to-layer="97" to-port="0" />
<edge from-layer="96" from-port="0" to-layer="97" to-port="1" />
<edge from-layer="97" from-port="2" to-layer="99" to-port="0" />
<edge from-layer="98" from-port="0" to-layer="99" to-port="1" />
<edge from-layer="99" from-port="2" to-layer="179" to-port="0" />
<edge from-layer="100" from-port="0" to-layer="101" to-port="0" />
<edge from-layer="101" from-port="1" to-layer="104" to-port="0" />
<edge from-layer="102" from-port="0" to-layer="103" to-port="0" />
<edge from-layer="103" from-port="1" to-layer="104" to-port="1" />
<edge from-layer="104" from-port="2" to-layer="106" to-port="0" />
<edge from-layer="105" from-port="0" to-layer="106" to-port="1" />
<edge from-layer="106" from-port="2" to-layer="108" to-port="0" />
<edge from-layer="107" from-port="0" to-layer="108" to-port="1" />
<edge from-layer="108" from-port="2" to-layer="109" to-port="0" />
<edge from-layer="109" from-port="1" to-layer="110" to-port="1" />
<edge from-layer="110" from-port="2" to-layer="112" to-port="0" />
<edge from-layer="111" from-port="0" to-layer="112" to-port="1" />
<edge from-layer="112" from-port="2" to-layer="114" to-port="0" />
<edge from-layer="113" from-port="0" to-layer="114" to-port="1" />
<edge from-layer="114" from-port="2" to-layer="179" to-port="1" />
<edge from-layer="114" from-port="2" to-layer="715" to-port="0" />
<edge from-layer="115" from-port="0" to-layer="116" to-port="0" />
<edge from-layer="116" from-port="1" to-layer="119" to-port="0" />
<edge from-layer="117" from-port="0" to-layer="118" to-port="0" />
<edge from-layer="118" from-port="1" to-layer="119" to-port="1" />
<edge from-layer="119" from-port="2" to-layer="121" to-port="0" />
<edge from-layer="120" from-port="0" to-layer="121" to-port="1" />
<edge from-layer="121" from-port="2" to-layer="123" to-port="0" />
<edge from-layer="122" from-port="0" to-layer="123" to-port="1" />
<edge from-layer="123" from-port="2" to-layer="124" to-port="0" />
<edge from-layer="124" from-port="1" to-layer="125" to-port="1" />
<edge from-layer="125" from-port="2" to-layer="127" to-port="0" />
<edge from-layer="126" from-port="0" to-layer="127" to-port="1" />
<edge from-layer="127" from-port="2" to-layer="129" to-port="0" />
<edge from-layer="128" from-port="0" to-layer="129" to-port="1" />
<edge from-layer="129" from-port="2" to-layer="131" to-port="0" />
<edge from-layer="130" from-port="0" to-layer="131" to-port="1" />
<edge from-layer="131" from-port="2" to-layer="179" to-port="2" />
<edge from-layer="131" from-port="2" to-layer="714" to-port="0" />
<edge from-layer="132" from-port="0" to-layer="147" to-port="0" />
<edge from-layer="132" from-port="0" to-layer="148" to-port="1" />
<edge from-layer="133" from-port="0" to-layer="141" to-port="0" />
<edge from-layer="134" from-port="0" to-layer="135" to-port="1" />
<edge from-layer="135" from-port="2" to-layer="178" to-port="2" />
<edge from-layer="135" from-port="2" to-layer="140" to-port="0" />
<edge from-layer="136" from-port="0" to-layer="137" to-port="1" />
<edge from-layer="137" from-port="2" to-layer="139" to-port="0" />
<edge from-layer="137" from-port="2" to-layer="159" to-port="1" />
<edge from-layer="138" from-port="0" to-layer="139" to-port="1" />
<edge from-layer="139" from-port="2" to-layer="140" to-port="1" />
<edge from-layer="140" from-port="2" to-layer="141" to-port="1" />
<edge from-layer="141" from-port="2" to-layer="142" to-port="0" />
<edge from-layer="141" from-port="2" to-layer="156" to-port="1" />
<edge from-layer="142" from-port="1" to-layer="145" to-port="0" />
<edge from-layer="143" from-port="0" to-layer="145" to-port="1" />
<edge from-layer="144" from-port="0" to-layer="145" to-port="2" />
<edge from-layer="145" from-port="3" to-layer="147" to-port="1" />
<edge from-layer="146" from-port="0" to-layer="152" to-port="2" />
<edge from-layer="146" from-port="0" to-layer="147" to-port="2" />
<edge from-layer="146" from-port="0" to-layer="153" to-port="1" />
<edge from-layer="147" from-port="3" to-layer="148" to-port="0" />
<edge from-layer="148" from-port="2" to-layer="154" to-port="0" />
<edge from-layer="149" from-port="0" to-layer="152" to-port="0" />
<edge from-layer="149" from-port="0" to-layer="151" to-port="1" />
<edge from-layer="150" from-port="1" to-layer="151" to-port="0" />
<edge from-layer="151" from-port="2" to-layer="152" to-port="1" />
<edge from-layer="152" from-port="3" to-layer="153" to-port="0" />
<edge from-layer="153" from-port="2" to-layer="154" to-port="1" />
<edge from-layer="154" from-port="2" to-layer="156" to-port="0" />
<edge from-layer="155" from-port="0" to-layer="156" to-port="2" />
<edge from-layer="156" from-port="3" to-layer="166" to-port="0" />
<edge from-layer="157" from-port="0" to-layer="159" to-port="0" />
<edge from-layer="158" from-port="0" to-layer="159" to-port="2" />
<edge from-layer="159" from-port="3" to-layer="160" to-port="0" />
<edge from-layer="160" from-port="1" to-layer="161" to-port="0" />
<edge from-layer="161" from-port="1" to-layer="164" to-port="0" />
<edge from-layer="162" from-port="0" to-layer="163" to-port="1" />
<edge from-layer="163" from-port="2" to-layer="164" to-port="1" />
<edge from-layer="164" from-port="2" to-layer="165" to-port="0" />
<edge from-layer="165" from-port="1" to-layer="166" to-port="1" />
<edge from-layer="166" from-port="2" to-layer="167" to-port="0" />
<edge from-layer="167" from-port="2" to-layer="169" to-port="0" />
<edge from-layer="168" from-port="0" to-layer="169" to-port="1" />
<edge from-layer="169" from-port="2" to-layer="174" to-port="0" />
<edge from-layer="170" from-port="0" to-layer="173" to-port="1" />
<edge from-layer="171" from-port="0" to-layer="173" to-port="2" />
<edge from-layer="172" from-port="0" to-layer="173" to-port="3" />
<edge from-layer="173" from-port="4" to-layer="174" to-port="1" />
<edge from-layer="174" from-port="2" to-layer="178" to-port="0" />
<edge from-layer="175" from-port="0" to-layer="178" to-port="1" />
<edge from-layer="176" from-port="0" to-layer="178" to-port="3" />
<edge from-layer="177" from-port="0" to-layer="178" to-port="4" />
<edge from-layer="178" from-port="5" to-layer="359" to-port="3" />
<edge from-layer="178" from-port="5" to-layer="539" to-port="3" />
<edge from-layer="178" from-port="5" to-layer="179" to-port="3" />
<edge from-layer="178" from-port="5" to-layer="733" to-port="3" />
<edge from-layer="179" from-port="4" to-layer="181" to-port="0" />
<edge from-layer="180" from-port="0" to-layer="181" to-port="1" />
<edge from-layer="181" from-port="2" to-layer="183" to-port="0" />
<edge from-layer="182" from-port="0" to-layer="183" to-port="1" />
<edge from-layer="183" from-port="2" to-layer="194" to-port="0" />
<edge from-layer="184" from-port="0" to-layer="185" to-port="0" />
<edge from-layer="185" from-port="1" to-layer="188" to-port="0" />
<edge from-layer="186" from-port="0" to-layer="187" to-port="0" />
<edge from-layer="187" from-port="1" to-layer="188" to-port="1" />
<edge from-layer="188" from-port="2" to-layer="190" to-port="0" />
<edge from-layer="189" from-port="0" to-layer="190" to-port="1" />
<edge from-layer="190" from-port="2" to-layer="192" to-port="0" />
<edge from-layer="191" from-port="0" to-layer="192" to-port="1" />
<edge from-layer="192" from-port="2" to-layer="193" to-port="0" />
<edge from-layer="193" from-port="1" to-layer="194" to-port="1" />
<edge from-layer="194" from-port="2" to-layer="196" to-port="0" />
<edge from-layer="195" from-port="0" to-layer="196" to-port="1" />
<edge from-layer="196" from-port="2" to-layer="197" to-port="1" />
<edge from-layer="197" from-port="2" to-layer="269" to-port="0" />
<edge from-layer="197" from-port="2" to-layer="199" to-port="0" />
<edge from-layer="198" from-port="0" to-layer="199" to-port="1" />
<edge from-layer="199" from-port="2" to-layer="201" to-port="0" />
<edge from-layer="200" from-port="0" to-layer="201" to-port="1" />
<edge from-layer="201" from-port="2" to-layer="203" to-port="0" />
<edge from-layer="202" from-port="0" to-layer="203" to-port="1" />
<edge from-layer="203" from-port="2" to-layer="214" to-port="0" />
<edge from-layer="204" from-port="0" to-layer="205" to-port="0" />
<edge from-layer="205" from-port="1" to-layer="208" to-port="0" />
<edge from-layer="206" from-port="0" to-layer="207" to-port="0" />
<edge from-layer="207" from-port="1" to-layer="208" to-port="1" />
<edge from-layer="208" from-port="2" to-layer="210" to-port="0" />
<edge from-layer="209" from-port="0" to-layer="210" to-port="1" />
<edge from-layer="210" from-port="2" to-layer="212" to-port="0" />
<edge from-layer="211" from-port="0" to-layer="212" to-port="1" />
<edge from-layer="212" from-port="2" to-layer="213" to-port="0" />
<edge from-layer="213" from-port="1" to-layer="214" to-port="1" />
<edge from-layer="214" from-port="2" to-layer="216" to-port="0" />
<edge from-layer="215" from-port="0" to-layer="216" to-port="1" />
<edge from-layer="216" from-port="2" to-layer="218" to-port="0" />
<edge from-layer="217" from-port="0" to-layer="218" to-port="1" />
<edge from-layer="218" from-port="2" to-layer="220" to-port="0" />
<edge from-layer="219" from-port="0" to-layer="220" to-port="1" />
<edge from-layer="220" from-port="2" to-layer="251" to-port="0" />
<edge from-layer="221" from-port="0" to-layer="222" to-port="0" />
<edge from-layer="222" from-port="1" to-layer="225" to-port="0" />
<edge from-layer="223" from-port="0" to-layer="224" to-port="0" />
<edge from-layer="224" from-port="1" to-layer="225" to-port="1" />
<edge from-layer="225" from-port="2" to-layer="227" to-port="0" />
<edge from-layer="226" from-port="0" to-layer="227" to-port="1" />
<edge from-layer="227" from-port="2" to-layer="229" to-port="0" />
<edge from-layer="228" from-port="0" to-layer="229" to-port="1" />
<edge from-layer="229" from-port="2" to-layer="230" to-port="0" />
<edge from-layer="230" from-port="1" to-layer="231" to-port="1" />
<edge from-layer="231" from-port="2" to-layer="232" to-port="0" />
<edge from-layer="232" from-port="2" to-layer="234" to-port="0" />
<edge from-layer="233" from-port="0" to-layer="234" to-port="1" />
<edge from-layer="234" from-port="2" to-layer="251" to-port="1" />
<edge from-layer="234" from-port="2" to-layer="713" to-port="0" />
<edge from-layer="235" from-port="0" to-layer="236" to-port="0" />
<edge from-layer="236" from-port="1" to-layer="239" to-port="0" />
<edge from-layer="237" from-port="0" to-layer="238" to-port="0" />
<edge from-layer="238" from-port="1" to-layer="239" to-port="1" />
<edge from-layer="239" from-port="2" to-layer="241" to-port="0" />
<edge from-layer="240" from-port="0" to-layer="241" to-port="1" />
<edge from-layer="241" from-port="2" to-layer="243" to-port="0" />
<edge from-layer="242" from-port="0" to-layer="243" to-port="1" />
<edge from-layer="243" from-port="2" to-layer="244" to-port="0" />
<edge from-layer="244" from-port="1" to-layer="245" to-port="1" />
<edge from-layer="245" from-port="2" to-layer="247" to-port="0" />
<edge from-layer="246" from-port="0" to-layer="247" to-port="1" />
<edge from-layer="247" from-port="2" to-layer="248" to-port="0" />
<edge from-layer="248" from-port="2" to-layer="250" to-port="0" />
<edge from-layer="249" from-port="0" to-layer="250" to-port="1" />
<edge from-layer="250" from-port="2" to-layer="712" to-port="0" />
<edge from-layer="250" from-port="2" to-layer="251" to-port="2" />
<edge from-layer="251" from-port="3" to-layer="253" to-port="0" />
<edge from-layer="252" from-port="0" to-layer="253" to-port="1" />
<edge from-layer="253" from-port="2" to-layer="255" to-port="0" />
<edge from-layer="254" from-port="0" to-layer="255" to-port="1" />
<edge from-layer="255" from-port="2" to-layer="266" to-port="0" />
<edge from-layer="256" from-port="0" to-layer="257" to-port="0" />
<edge from-layer="257" from-port="1" to-layer="260" to-port="0" />
<edge from-layer="258" from-port="0" to-layer="259" to-port="0" />
<edge from-layer="259" from-port="1" to-layer="260" to-port="1" />
<edge from-layer="260" from-port="2" to-layer="262" to-port="0" />
<edge from-layer="261" from-port="0" to-layer="262" to-port="1" />
<edge from-layer="262" from-port="2" to-layer="264" to-port="0" />
<edge from-layer="263" from-port="0" to-layer="264" to-port="1" />
<edge from-layer="264" from-port="2" to-layer="265" to-port="0" />
<edge from-layer="265" from-port="1" to-layer="266" to-port="1" />
<edge from-layer="266" from-port="2" to-layer="268" to-port="0" />
<edge from-layer="267" from-port="0" to-layer="268" to-port="1" />
<edge from-layer="268" from-port="2" to-layer="269" to-port="1" />
<edge from-layer="269" from-port="2" to-layer="303" to-port="0" />
<edge from-layer="269" from-port="2" to-layer="271" to-port="0" />
<edge from-layer="270" from-port="0" to-layer="271" to-port="1" />
<edge from-layer="271" from-port="2" to-layer="273" to-port="0" />
<edge from-layer="272" from-port="0" to-layer="273" to-port="1" />
<edge from-layer="273" from-port="2" to-layer="275" to-port="0" />
<edge from-layer="274" from-port="0" to-layer="275" to-port="1" />
<edge from-layer="275" from-port="2" to-layer="286" to-port="0" />
<edge from-layer="276" from-port="0" to-layer="277" to-port="0" />
<edge from-layer="277" from-port="1" to-layer="280" to-port="0" />
<edge from-layer="278" from-port="0" to-layer="279" to-port="0" />
<edge from-layer="279" from-port="1" to-layer="280" to-port="1" />
<edge from-layer="280" from-port="2" to-layer="282" to-port="0" />
<edge from-layer="281" from-port="0" to-layer="282" to-port="1" />
<edge from-layer="282" from-port="2" to-layer="284" to-port="0" />
<edge from-layer="283" from-port="0" to-layer="284" to-port="1" />
<edge from-layer="284" from-port="2" to-layer="285" to-port="0" />
<edge from-layer="285" from-port="1" to-layer="286" to-port="1" />
<edge from-layer="286" from-port="2" to-layer="288" to-port="0" />
<edge from-layer="287" from-port="0" to-layer="288" to-port="1" />
<edge from-layer="288" from-port="2" to-layer="289" to-port="0" />
<edge from-layer="289" from-port="1" to-layer="300" to-port="0" />
<edge from-layer="290" from-port="0" to-layer="291" to-port="0" />
<edge from-layer="291" from-port="1" to-layer="294" to-port="0" />
<edge from-layer="292" from-port="0" to-layer="293" to-port="0" />
<edge from-layer="293" from-port="1" to-layer="294" to-port="1" />
<edge from-layer="294" from-port="2" to-layer="296" to-port="0" />
<edge from-layer="295" from-port="0" to-layer="296" to-port="1" />
<edge from-layer="296" from-port="2" to-layer="298" to-port="0" />
<edge from-layer="297" from-port="0" to-layer="298" to-port="1" />
<edge from-layer="298" from-port="2" to-layer="299" to-port="0" />
<edge from-layer="299" from-port="1" to-layer="300" to-port="1" />
<edge from-layer="300" from-port="2" to-layer="302" to-port="0" />
<edge from-layer="301" from-port="0" to-layer="302" to-port="1" />
<edge from-layer="302" from-port="2" to-layer="303" to-port="1" />
<edge from-layer="303" from-port="2" to-layer="305" to-port="0" />
<edge from-layer="303" from-port="2" to-layer="377" to-port="0" />
<edge from-layer="304" from-port="0" to-layer="305" to-port="1" />
<edge from-layer="305" from-port="2" to-layer="307" to-port="0" />
<edge from-layer="306" from-port="0" to-layer="307" to-port="1" />
<edge from-layer="307" from-port="2" to-layer="309" to-port="0" />
<edge from-layer="308" from-port="0" to-layer="309" to-port="1" />
<edge from-layer="309" from-port="2" to-layer="352" to-port="0" />
<edge from-layer="309" from-port="2" to-layer="337" to-port="0" />
<edge from-layer="309" from-port="2" to-layer="320" to-port="0" />
<edge from-layer="310" from-port="0" to-layer="311" to-port="0" />
<edge from-layer="311" from-port="1" to-layer="314" to-port="0" />
<edge from-layer="312" from-port="0" to-layer="313" to-port="0" />
<edge from-layer="313" from-port="1" to-layer="314" to-port="1" />
<edge from-layer="314" from-port="2" to-layer="316" to-port="0" />
<edge from-layer="315" from-port="0" to-layer="316" to-port="1" />
<edge from-layer="316" from-port="2" to-layer="318" to-port="0" />
<edge from-layer="317" from-port="0" to-layer="318" to-port="1" />
<edge from-layer="318" from-port="2" to-layer="319" to-port="0" />
<edge from-layer="319" from-port="1" to-layer="320" to-port="1" />
<edge from-layer="320" from-port="2" to-layer="322" to-port="0" />
<edge from-layer="321" from-port="0" to-layer="322" to-port="1" />
<edge from-layer="322" from-port="2" to-layer="324" to-port="0" />
<edge from-layer="323" from-port="0" to-layer="324" to-port="1" />
<edge from-layer="324" from-port="2" to-layer="326" to-port="0" />
<edge from-layer="325" from-port="0" to-layer="326" to-port="1" />
<edge from-layer="326" from-port="2" to-layer="359" to-port="0" />
<edge from-layer="327" from-port="0" to-layer="328" to-port="0" />
<edge from-layer="328" from-port="1" to-layer="331" to-port="0" />
<edge from-layer="329" from-port="0" to-layer="330" to-port="0" />
<edge from-layer="330" from-port="1" to-layer="331" to-port="1" />
<edge from-layer="331" from-port="2" to-layer="333" to-port="0" />
<edge from-layer="332" from-port="0" to-layer="333" to-port="1" />
<edge from-layer="333" from-port="2" to-layer="335" to-port="0" />
<edge from-layer="334" from-port="0" to-layer="335" to-port="1" />
<edge from-layer="335" from-port="2" to-layer="336" to-port="0" />
<edge from-layer="336" from-port="1" to-layer="337" to-port="1" />
<edge from-layer="337" from-port="2" to-layer="339" to-port="0" />
<edge from-layer="338" from-port="0" to-layer="339" to-port="1" />
<edge from-layer="339" from-port="2" to-layer="341" to-port="0" />
<edge from-layer="340" from-port="0" to-layer="341" to-port="1" />
<edge from-layer="341" from-port="2" to-layer="359" to-port="1" />
<edge from-layer="341" from-port="2" to-layer="711" to-port="0" />
<edge from-layer="342" from-port="0" to-layer="343" to-port="0" />
<edge from-layer="343" from-port="1" to-layer="346" to-port="0" />
<edge from-layer="344" from-port="0" to-layer="345" to-port="0" />
<edge from-layer="345" from-port="1" to-layer="346" to-port="1" />
<edge from-layer="346" from-port="2" to-layer="348" to-port="0" />
<edge from-layer="347" from-port="0" to-layer="348" to-port="1" />
<edge from-layer="348" from-port="2" to-layer="350" to-port="0" />
<edge from-layer="349" from-port="0" to-layer="350" to-port="1" />
<edge from-layer="350" from-port="2" to-layer="351" to-port="0" />
<edge from-layer="351" from-port="1" to-layer="352" to-port="1" />
<edge from-layer="352" from-port="2" to-layer="354" to-port="0" />
<edge from-layer="353" from-port="0" to-layer="354" to-port="1" />
<edge from-layer="354" from-port="2" to-layer="356" to-port="0" />
<edge from-layer="355" from-port="0" to-layer="356" to-port="1" />
<edge from-layer="356" from-port="2" to-layer="358" to-port="0" />
<edge from-layer="357" from-port="0" to-layer="358" to-port="1" />
<edge from-layer="358" from-port="2" to-layer="359" to-port="2" />
<edge from-layer="358" from-port="2" to-layer="710" to-port="0" />
<edge from-layer="359" from-port="4" to-layer="361" to-port="0" />
<edge from-layer="360" from-port="0" to-layer="361" to-port="1" />
<edge from-layer="361" from-port="2" to-layer="363" to-port="0" />
<edge from-layer="362" from-port="0" to-layer="363" to-port="1" />
<edge from-layer="363" from-port="2" to-layer="374" to-port="0" />
<edge from-layer="364" from-port="0" to-layer="365" to-port="0" />
<edge from-layer="365" from-port="1" to-layer="368" to-port="0" />
<edge from-layer="366" from-port="0" to-layer="367" to-port="0" />
<edge from-layer="367" from-port="1" to-layer="368" to-port="1" />
<edge from-layer="368" from-port="2" to-layer="370" to-port="0" />
<edge from-layer="369" from-port="0" to-layer="370" to-port="1" />
<edge from-layer="370" from-port="2" to-layer="372" to-port="0" />
<edge from-layer="371" from-port="0" to-layer="372" to-port="1" />
<edge from-layer="372" from-port="2" to-layer="373" to-port="0" />
<edge from-layer="373" from-port="1" to-layer="374" to-port="1" />
<edge from-layer="374" from-port="2" to-layer="376" to-port="0" />
<edge from-layer="375" from-port="0" to-layer="376" to-port="1" />
<edge from-layer="376" from-port="2" to-layer="377" to-port="1" />
<edge from-layer="377" from-port="2" to-layer="449" to-port="0" />
<edge from-layer="377" from-port="2" to-layer="379" to-port="0" />
<edge from-layer="378" from-port="0" to-layer="379" to-port="1" />
<edge from-layer="379" from-port="2" to-layer="381" to-port="0" />
<edge from-layer="380" from-port="0" to-layer="381" to-port="1" />
<edge from-layer="381" from-port="2" to-layer="383" to-port="0" />
<edge from-layer="382" from-port="0" to-layer="383" to-port="1" />
<edge from-layer="383" from-port="2" to-layer="394" to-port="0" />
<edge from-layer="384" from-port="0" to-layer="385" to-port="0" />
<edge from-layer="385" from-port="1" to-layer="388" to-port="0" />
<edge from-layer="386" from-port="0" to-layer="387" to-port="0" />
<edge from-layer="387" from-port="1" to-layer="388" to-port="1" />
<edge from-layer="388" from-port="2" to-layer="390" to-port="0" />
<edge from-layer="389" from-port="0" to-layer="390" to-port="1" />
<edge from-layer="390" from-port="2" to-layer="392" to-port="0" />
<edge from-layer="391" from-port="0" to-layer="392" to-port="1" />
<edge from-layer="392" from-port="2" to-layer="393" to-port="0" />
<edge from-layer="393" from-port="1" to-layer="394" to-port="1" />
<edge from-layer="394" from-port="2" to-layer="396" to-port="0" />
<edge from-layer="395" from-port="0" to-layer="396" to-port="1" />
<edge from-layer="396" from-port="2" to-layer="398" to-port="0" />
<edge from-layer="397" from-port="0" to-layer="398" to-port="1" />
<edge from-layer="398" from-port="2" to-layer="400" to-port="0" />
<edge from-layer="399" from-port="0" to-layer="400" to-port="1" />
<edge from-layer="400" from-port="2" to-layer="431" to-port="0" />
<edge from-layer="401" from-port="0" to-layer="402" to-port="0" />
<edge from-layer="402" from-port="1" to-layer="405" to-port="0" />
<edge from-layer="403" from-port="0" to-layer="404" to-port="0" />
<edge from-layer="404" from-port="1" to-layer="405" to-port="1" />
<edge from-layer="405" from-port="2" to-layer="407" to-port="0" />
<edge from-layer="406" from-port="0" to-layer="407" to-port="1" />
<edge from-layer="407" from-port="2" to-layer="409" to-port="0" />
<edge from-layer="408" from-port="0" to-layer="409" to-port="1" />
<edge from-layer="409" from-port="2" to-layer="410" to-port="0" />
<edge from-layer="410" from-port="1" to-layer="411" to-port="1" />
<edge from-layer="411" from-port="2" to-layer="412" to-port="0" />
<edge from-layer="412" from-port="2" to-layer="414" to-port="0" />
<edge from-layer="413" from-port="0" to-layer="414" to-port="1" />
<edge from-layer="414" from-port="2" to-layer="709" to-port="0" />
<edge from-layer="414" from-port="2" to-layer="431" to-port="1" />
<edge from-layer="415" from-port="0" to-layer="416" to-port="0" />
<edge from-layer="416" from-port="1" to-layer="419" to-port="0" />
<edge from-layer="417" from-port="0" to-layer="418" to-port="0" />
<edge from-layer="418" from-port="1" to-layer="419" to-port="1" />
<edge from-layer="419" from-port="2" to-layer="421" to-port="0" />
<edge from-layer="420" from-port="0" to-layer="421" to-port="1" />
<edge from-layer="421" from-port="2" to-layer="423" to-port="0" />
<edge from-layer="422" from-port="0" to-layer="423" to-port="1" />
<edge from-layer="423" from-port="2" to-layer="424" to-port="0" />
<edge from-layer="424" from-port="1" to-layer="425" to-port="1" />
<edge from-layer="425" from-port="2" to-layer="427" to-port="0" />
<edge from-layer="426" from-port="0" to-layer="427" to-port="1" />
<edge from-layer="427" from-port="2" to-layer="428" to-port="0" />
<edge from-layer="428" from-port="2" to-layer="430" to-port="0" />
<edge from-layer="429" from-port="0" to-layer="430" to-port="1" />
<edge from-layer="430" from-port="2" to-layer="431" to-port="2" />
<edge from-layer="430" from-port="2" to-layer="708" to-port="0" />
<edge from-layer="431" from-port="3" to-layer="433" to-port="0" />
<edge from-layer="432" from-port="0" to-layer="433" to-port="1" />
<edge from-layer="433" from-port="2" to-layer="435" to-port="0" />
<edge from-layer="434" from-port="0" to-layer="435" to-port="1" />
<edge from-layer="435" from-port="2" to-layer="446" to-port="0" />
<edge from-layer="436" from-port="0" to-layer="437" to-port="0" />
<edge from-layer="437" from-port="1" to-layer="440" to-port="0" />
<edge from-layer="438" from-port="0" to-layer="439" to-port="0" />
<edge from-layer="439" from-port="1" to-layer="440" to-port="1" />
<edge from-layer="440" from-port="2" to-layer="442" to-port="0" />
<edge from-layer="441" from-port="0" to-layer="442" to-port="1" />
<edge from-layer="442" from-port="2" to-layer="444" to-port="0" />
<edge from-layer="443" from-port="0" to-layer="444" to-port="1" />
<edge from-layer="444" from-port="2" to-layer="445" to-port="0" />
<edge from-layer="445" from-port="1" to-layer="446" to-port="1" />
<edge from-layer="446" from-port="2" to-layer="448" to-port="0" />
<edge from-layer="447" from-port="0" to-layer="448" to-port="1" />
<edge from-layer="448" from-port="2" to-layer="449" to-port="1" />
<edge from-layer="449" from-port="2" to-layer="483" to-port="0" />
<edge from-layer="449" from-port="2" to-layer="451" to-port="0" />
<edge from-layer="450" from-port="0" to-layer="451" to-port="1" />
<edge from-layer="451" from-port="2" to-layer="453" to-port="0" />
<edge from-layer="452" from-port="0" to-layer="453" to-port="1" />
<edge from-layer="453" from-port="2" to-layer="455" to-port="0" />
<edge from-layer="454" from-port="0" to-layer="455" to-port="1" />
<edge from-layer="455" from-port="2" to-layer="466" to-port="0" />
<edge from-layer="456" from-port="0" to-layer="457" to-port="0" />
<edge from-layer="457" from-port="1" to-layer="460" to-port="0" />
<edge from-layer="458" from-port="0" to-layer="459" to-port="0" />
<edge from-layer="459" from-port="1" to-layer="460" to-port="1" />
<edge from-layer="460" from-port="2" to-layer="462" to-port="0" />
<edge from-layer="461" from-port="0" to-layer="462" to-port="1" />
<edge from-layer="462" from-port="2" to-layer="464" to-port="0" />
<edge from-layer="463" from-port="0" to-layer="464" to-port="1" />
<edge from-layer="464" from-port="2" to-layer="465" to-port="0" />
<edge from-layer="465" from-port="1" to-layer="466" to-port="1" />
<edge from-layer="466" from-port="2" to-layer="468" to-port="0" />
<edge from-layer="467" from-port="0" to-layer="468" to-port="1" />
<edge from-layer="468" from-port="2" to-layer="469" to-port="0" />
<edge from-layer="469" from-port="1" to-layer="480" to-port="0" />
<edge from-layer="470" from-port="0" to-layer="471" to-port="0" />
<edge from-layer="471" from-port="1" to-layer="474" to-port="0" />
<edge from-layer="472" from-port="0" to-layer="473" to-port="0" />
<edge from-layer="473" from-port="1" to-layer="474" to-port="1" />
<edge from-layer="474" from-port="2" to-layer="476" to-port="0" />
<edge from-layer="475" from-port="0" to-layer="476" to-port="1" />
<edge from-layer="476" from-port="2" to-layer="478" to-port="0" />
<edge from-layer="477" from-port="0" to-layer="478" to-port="1" />
<edge from-layer="478" from-port="2" to-layer="479" to-port="0" />
<edge from-layer="479" from-port="1" to-layer="480" to-port="1" />
<edge from-layer="480" from-port="2" to-layer="482" to-port="0" />
<edge from-layer="481" from-port="0" to-layer="482" to-port="1" />
<edge from-layer="482" from-port="2" to-layer="483" to-port="1" />
<edge from-layer="483" from-port="2" to-layer="485" to-port="0" />
<edge from-layer="483" from-port="2" to-layer="557" to-port="0" />
<edge from-layer="484" from-port="0" to-layer="485" to-port="1" />
<edge from-layer="485" from-port="2" to-layer="487" to-port="0" />
<edge from-layer="486" from-port="0" to-layer="487" to-port="1" />
<edge from-layer="487" from-port="2" to-layer="489" to-port="0" />
<edge from-layer="488" from-port="0" to-layer="489" to-port="1" />
<edge from-layer="489" from-port="2" to-layer="532" to-port="0" />
<edge from-layer="489" from-port="2" to-layer="517" to-port="0" />
<edge from-layer="489" from-port="2" to-layer="500" to-port="0" />
<edge from-layer="490" from-port="0" to-layer="491" to-port="0" />
<edge from-layer="491" from-port="1" to-layer="494" to-port="0" />
<edge from-layer="492" from-port="0" to-layer="493" to-port="0" />
<edge from-layer="493" from-port="1" to-layer="494" to-port="1" />
<edge from-layer="494" from-port="2" to-layer="496" to-port="0" />
<edge from-layer="495" from-port="0" to-layer="496" to-port="1" />
<edge from-layer="496" from-port="2" to-layer="498" to-port="0" />
<edge from-layer="497" from-port="0" to-layer="498" to-port="1" />
<edge from-layer="498" from-port="2" to-layer="499" to-port="0" />
<edge from-layer="499" from-port="1" to-layer="500" to-port="1" />
<edge from-layer="500" from-port="2" to-layer="502" to-port="0" />
<edge from-layer="501" from-port="0" to-layer="502" to-port="1" />
<edge from-layer="502" from-port="2" to-layer="504" to-port="0" />
<edge from-layer="503" from-port="0" to-layer="504" to-port="1" />
<edge from-layer="504" from-port="2" to-layer="506" to-port="0" />
<edge from-layer="505" from-port="0" to-layer="506" to-port="1" />
<edge from-layer="506" from-port="2" to-layer="539" to-port="0" />
<edge from-layer="507" from-port="0" to-layer="508" to-port="0" />
<edge from-layer="508" from-port="1" to-layer="511" to-port="0" />
<edge from-layer="509" from-port="0" to-layer="510" to-port="0" />
<edge from-layer="510" from-port="1" to-layer="511" to-port="1" />
<edge from-layer="511" from-port="2" to-layer="513" to-port="0" />
<edge from-layer="512" from-port="0" to-layer="513" to-port="1" />
<edge from-layer="513" from-port="2" to-layer="515" to-port="0" />
<edge from-layer="514" from-port="0" to-layer="515" to-port="1" />
<edge from-layer="515" from-port="2" to-layer="516" to-port="0" />
<edge from-layer="516" from-port="1" to-layer="517" to-port="1" />
<edge from-layer="517" from-port="2" to-layer="519" to-port="0" />
<edge from-layer="518" from-port="0" to-layer="519" to-port="1" />
<edge from-layer="519" from-port="2" to-layer="521" to-port="0" />
<edge from-layer="520" from-port="0" to-layer="521" to-port="1" />
<edge from-layer="521" from-port="2" to-layer="539" to-port="1" />
<edge from-layer="521" from-port="2" to-layer="707" to-port="0" />
<edge from-layer="522" from-port="0" to-layer="523" to-port="0" />
<edge from-layer="523" from-port="1" to-layer="526" to-port="0" />
<edge from-layer="524" from-port="0" to-layer="525" to-port="0" />
<edge from-layer="525" from-port="1" to-layer="526" to-port="1" />
<edge from-layer="526" from-port="2" to-layer="528" to-port="0" />
<edge from-layer="527" from-port="0" to-layer="528" to-port="1" />
<edge from-layer="528" from-port="2" to-layer="530" to-port="0" />
<edge from-layer="529" from-port="0" to-layer="530" to-port="1" />
<edge from-layer="530" from-port="2" to-layer="531" to-port="0" />
<edge from-layer="531" from-port="1" to-layer="532" to-port="1" />
<edge from-layer="532" from-port="2" to-layer="534" to-port="0" />
<edge from-layer="533" from-port="0" to-layer="534" to-port="1" />
<edge from-layer="534" from-port="2" to-layer="536" to-port="0" />
<edge from-layer="535" from-port="0" to-layer="536" to-port="1" />
<edge from-layer="536" from-port="2" to-layer="538" to-port="0" />
<edge from-layer="537" from-port="0" to-layer="538" to-port="1" />
<edge from-layer="538" from-port="2" to-layer="706" to-port="0" />
<edge from-layer="538" from-port="2" to-layer="539" to-port="2" />
<edge from-layer="539" from-port="4" to-layer="541" to-port="0" />
<edge from-layer="540" from-port="0" to-layer="541" to-port="1" />
<edge from-layer="541" from-port="2" to-layer="543" to-port="0" />
<edge from-layer="542" from-port="0" to-layer="543" to-port="1" />
<edge from-layer="543" from-port="2" to-layer="554" to-port="0" />
<edge from-layer="544" from-port="0" to-layer="545" to-port="0" />
<edge from-layer="545" from-port="1" to-layer="548" to-port="0" />
<edge from-layer="546" from-port="0" to-layer="547" to-port="0" />
<edge from-layer="547" from-port="1" to-layer="548" to-port="1" />
<edge from-layer="548" from-port="2" to-layer="550" to-port="0" />
<edge from-layer="549" from-port="0" to-layer="550" to-port="1" />
<edge from-layer="550" from-port="2" to-layer="552" to-port="0" />
<edge from-layer="551" from-port="0" to-layer="552" to-port="1" />
<edge from-layer="552" from-port="2" to-layer="553" to-port="0" />
<edge from-layer="553" from-port="1" to-layer="554" to-port="1" />
<edge from-layer="554" from-port="2" to-layer="556" to-port="0" />
<edge from-layer="555" from-port="0" to-layer="556" to-port="1" />
<edge from-layer="556" from-port="2" to-layer="557" to-port="1" />
<edge from-layer="557" from-port="2" to-layer="629" to-port="0" />
<edge from-layer="557" from-port="2" to-layer="559" to-port="0" />
<edge from-layer="558" from-port="0" to-layer="559" to-port="1" />
<edge from-layer="559" from-port="2" to-layer="561" to-port="0" />
<edge from-layer="560" from-port="0" to-layer="561" to-port="1" />
<edge from-layer="561" from-port="2" to-layer="563" to-port="0" />
<edge from-layer="562" from-port="0" to-layer="563" to-port="1" />
<edge from-layer="563" from-port="2" to-layer="574" to-port="0" />
<edge from-layer="564" from-port="0" to-layer="565" to-port="0" />
<edge from-layer="565" from-port="1" to-layer="568" to-port="0" />
<edge from-layer="566" from-port="0" to-layer="567" to-port="0" />
<edge from-layer="567" from-port="1" to-layer="568" to-port="1" />
<edge from-layer="568" from-port="2" to-layer="570" to-port="0" />
<edge from-layer="569" from-port="0" to-layer="570" to-port="1" />
<edge from-layer="570" from-port="2" to-layer="572" to-port="0" />
<edge from-layer="571" from-port="0" to-layer="572" to-port="1" />
<edge from-layer="572" from-port="2" to-layer="573" to-port="0" />
<edge from-layer="573" from-port="1" to-layer="574" to-port="1" />
<edge from-layer="574" from-port="2" to-layer="576" to-port="0" />
<edge from-layer="575" from-port="0" to-layer="576" to-port="1" />
<edge from-layer="576" from-port="2" to-layer="578" to-port="0" />
<edge from-layer="577" from-port="0" to-layer="578" to-port="1" />
<edge from-layer="578" from-port="2" to-layer="580" to-port="0" />
<edge from-layer="579" from-port="0" to-layer="580" to-port="1" />
<edge from-layer="580" from-port="2" to-layer="611" to-port="0" />
<edge from-layer="581" from-port="0" to-layer="582" to-port="0" />
<edge from-layer="582" from-port="1" to-layer="585" to-port="0" />
<edge from-layer="583" from-port="0" to-layer="584" to-port="0" />
<edge from-layer="584" from-port="1" to-layer="585" to-port="1" />
<edge from-layer="585" from-port="2" to-layer="587" to-port="0" />
<edge from-layer="586" from-port="0" to-layer="587" to-port="1" />
<edge from-layer="587" from-port="2" to-layer="589" to-port="0" />
<edge from-layer="588" from-port="0" to-layer="589" to-port="1" />
<edge from-layer="589" from-port="2" to-layer="590" to-port="0" />
<edge from-layer="590" from-port="1" to-layer="591" to-port="1" />
<edge from-layer="591" from-port="2" to-layer="592" to-port="0" />
<edge from-layer="592" from-port="2" to-layer="594" to-port="0" />
<edge from-layer="593" from-port="0" to-layer="594" to-port="1" />
<edge from-layer="594" from-port="2" to-layer="705" to-port="0" />
<edge from-layer="594" from-port="2" to-layer="611" to-port="1" />
<edge from-layer="595" from-port="0" to-layer="596" to-port="0" />
<edge from-layer="596" from-port="1" to-layer="599" to-port="0" />
<edge from-layer="597" from-port="0" to-layer="598" to-port="0" />
<edge from-layer="598" from-port="1" to-layer="599" to-port="1" />
<edge from-layer="599" from-port="2" to-layer="601" to-port="0" />
<edge from-layer="600" from-port="0" to-layer="601" to-port="1" />
<edge from-layer="601" from-port="2" to-layer="603" to-port="0" />
<edge from-layer="602" from-port="0" to-layer="603" to-port="1" />
<edge from-layer="603" from-port="2" to-layer="604" to-port="0" />
<edge from-layer="604" from-port="1" to-layer="605" to-port="1" />
<edge from-layer="605" from-port="2" to-layer="607" to-port="0" />
<edge from-layer="606" from-port="0" to-layer="607" to-port="1" />
<edge from-layer="607" from-port="2" to-layer="608" to-port="0" />
<edge from-layer="608" from-port="2" to-layer="610" to-port="0" />
<edge from-layer="609" from-port="0" to-layer="610" to-port="1" />
<edge from-layer="610" from-port="2" to-layer="704" to-port="0" />
<edge from-layer="610" from-port="2" to-layer="611" to-port="2" />
<edge from-layer="611" from-port="3" to-layer="613" to-port="0" />
<edge from-layer="612" from-port="0" to-layer="613" to-port="1" />
<edge from-layer="613" from-port="2" to-layer="615" to-port="0" />
<edge from-layer="614" from-port="0" to-layer="615" to-port="1" />
<edge from-layer="615" from-port="2" to-layer="626" to-port="0" />
<edge from-layer="616" from-port="0" to-layer="617" to-port="0" />
<edge from-layer="617" from-port="1" to-layer="620" to-port="0" />
<edge from-layer="618" from-port="0" to-layer="619" to-port="0" />
<edge from-layer="619" from-port="1" to-layer="620" to-port="1" />
<edge from-layer="620" from-port="2" to-layer="622" to-port="0" />
<edge from-layer="621" from-port="0" to-layer="622" to-port="1" />
<edge from-layer="622" from-port="2" to-layer="624" to-port="0" />
<edge from-layer="623" from-port="0" to-layer="624" to-port="1" />
<edge from-layer="624" from-port="2" to-layer="625" to-port="0" />
<edge from-layer="625" from-port="1" to-layer="626" to-port="1" />
<edge from-layer="626" from-port="2" to-layer="628" to-port="0" />
<edge from-layer="627" from-port="0" to-layer="628" to-port="1" />
<edge from-layer="628" from-port="2" to-layer="629" to-port="1" />
<edge from-layer="629" from-port="2" to-layer="631" to-port="0" />
<edge from-layer="629" from-port="2" to-layer="663" to-port="0" />
<edge from-layer="630" from-port="0" to-layer="631" to-port="1" />
<edge from-layer="631" from-port="2" to-layer="633" to-port="0" />
<edge from-layer="632" from-port="0" to-layer="633" to-port="1" />
<edge from-layer="633" from-port="2" to-layer="635" to-port="0" />
<edge from-layer="634" from-port="0" to-layer="635" to-port="1" />
<edge from-layer="635" from-port="2" to-layer="646" to-port="0" />
<edge from-layer="636" from-port="0" to-layer="637" to-port="0" />
<edge from-layer="637" from-port="1" to-layer="640" to-port="0" />
<edge from-layer="638" from-port="0" to-layer="639" to-port="0" />
<edge from-layer="639" from-port="1" to-layer="640" to-port="1" />
<edge from-layer="640" from-port="2" to-layer="642" to-port="0" />
<edge from-layer="641" from-port="0" to-layer="642" to-port="1" />
<edge from-layer="642" from-port="2" to-layer="644" to-port="0" />
<edge from-layer="643" from-port="0" to-layer="644" to-port="1" />
<edge from-layer="644" from-port="2" to-layer="645" to-port="0" />
<edge from-layer="645" from-port="1" to-layer="646" to-port="1" />
<edge from-layer="646" from-port="2" to-layer="648" to-port="0" />
<edge from-layer="647" from-port="0" to-layer="648" to-port="1" />
<edge from-layer="648" from-port="2" to-layer="649" to-port="0" />
<edge from-layer="649" from-port="1" to-layer="660" to-port="0" />
<edge from-layer="650" from-port="0" to-layer="651" to-port="0" />
<edge from-layer="651" from-port="1" to-layer="654" to-port="0" />
<edge from-layer="652" from-port="0" to-layer="653" to-port="0" />
<edge from-layer="653" from-port="1" to-layer="654" to-port="1" />
<edge from-layer="654" from-port="2" to-layer="656" to-port="0" />
<edge from-layer="655" from-port="0" to-layer="656" to-port="1" />
<edge from-layer="656" from-port="2" to-layer="658" to-port="0" />
<edge from-layer="657" from-port="0" to-layer="658" to-port="1" />
<edge from-layer="658" from-port="2" to-layer="659" to-port="0" />
<edge from-layer="659" from-port="1" to-layer="660" to-port="1" />
<edge from-layer="660" from-port="2" to-layer="662" to-port="0" />
<edge from-layer="661" from-port="0" to-layer="662" to-port="1" />
<edge from-layer="662" from-port="2" to-layer="663" to-port="1" />
<edge from-layer="663" from-port="2" to-layer="751" to-port="0" />
<edge from-layer="663" from-port="2" to-layer="665" to-port="0" />
<edge from-layer="664" from-port="0" to-layer="665" to-port="1" />
<edge from-layer="665" from-port="2" to-layer="667" to-port="0" />
<edge from-layer="666" from-port="0" to-layer="667" to-port="1" />
<edge from-layer="667" from-port="2" to-layer="669" to-port="0" />
<edge from-layer="668" from-port="0" to-layer="669" to-port="1" />
<edge from-layer="669" from-port="2" to-layer="726" to-port="0" />
<edge from-layer="669" from-port="2" to-layer="680" to-port="0" />
<edge from-layer="669" from-port="2" to-layer="698" to-port="0" />
<edge from-layer="670" from-port="0" to-layer="671" to-port="0" />
<edge from-layer="671" from-port="1" to-layer="674" to-port="0" />
<edge from-layer="672" from-port="0" to-layer="673" to-port="0" />
<edge from-layer="673" from-port="1" to-layer="674" to-port="1" />
<edge from-layer="674" from-port="2" to-layer="676" to-port="0" />
<edge from-layer="675" from-port="0" to-layer="676" to-port="1" />
<edge from-layer="676" from-port="2" to-layer="678" to-port="0" />
<edge from-layer="677" from-port="0" to-layer="678" to-port="1" />
<edge from-layer="678" from-port="2" to-layer="679" to-port="0" />
<edge from-layer="679" from-port="1" to-layer="680" to-port="1" />
<edge from-layer="680" from-port="2" to-layer="682" to-port="0" />
<edge from-layer="681" from-port="0" to-layer="682" to-port="1" />
<edge from-layer="682" from-port="2" to-layer="684" to-port="0" />
<edge from-layer="683" from-port="0" to-layer="684" to-port="1" />
<edge from-layer="684" from-port="2" to-layer="686" to-port="0" />
<edge from-layer="685" from-port="0" to-layer="686" to-port="1" />
<edge from-layer="686" from-port="2" to-layer="687" to-port="0" />
<edge from-layer="686" from-port="2" to-layer="733" to-port="2" />
<edge from-layer="688" from-port="0" to-layer="689" to-port="0" />
<edge from-layer="689" from-port="1" to-layer="692" to-port="0" />
<edge from-layer="690" from-port="0" to-layer="691" to-port="0" />
<edge from-layer="691" from-port="1" to-layer="692" to-port="1" />
<edge from-layer="692" from-port="2" to-layer="694" to-port="0" />
<edge from-layer="693" from-port="0" to-layer="694" to-port="1" />
<edge from-layer="694" from-port="2" to-layer="696" to-port="0" />
<edge from-layer="695" from-port="0" to-layer="696" to-port="1" />
<edge from-layer="696" from-port="2" to-layer="697" to-port="0" />
<edge from-layer="697" from-port="1" to-layer="698" to-port="1" />
<edge from-layer="698" from-port="2" to-layer="700" to-port="0" />
<edge from-layer="699" from-port="0" to-layer="700" to-port="1" />
<edge from-layer="700" from-port="2" to-layer="702" to-port="0" />
<edge from-layer="701" from-port="0" to-layer="702" to-port="1" />
<edge from-layer="702" from-port="2" to-layer="733" to-port="1" />
<edge from-layer="702" from-port="2" to-layer="703" to-port="0" />
<edge from-layer="716" from-port="0" to-layer="717" to-port="0" />
<edge from-layer="717" from-port="1" to-layer="720" to-port="0" />
<edge from-layer="718" from-port="0" to-layer="719" to-port="0" />
<edge from-layer="719" from-port="1" to-layer="720" to-port="1" />
<edge from-layer="720" from-port="2" to-layer="722" to-port="0" />
<edge from-layer="721" from-port="0" to-layer="722" to-port="1" />
<edge from-layer="722" from-port="2" to-layer="724" to-port="0" />
<edge from-layer="723" from-port="0" to-layer="724" to-port="1" />
<edge from-layer="724" from-port="2" to-layer="725" to-port="0" />
<edge from-layer="725" from-port="1" to-layer="726" to-port="1" />
<edge from-layer="726" from-port="2" to-layer="728" to-port="0" />
<edge from-layer="727" from-port="0" to-layer="728" to-port="1" />
<edge from-layer="728" from-port="2" to-layer="730" to-port="0" />
<edge from-layer="729" from-port="0" to-layer="730" to-port="1" />
<edge from-layer="730" from-port="2" to-layer="732" to-port="0" />
<edge from-layer="731" from-port="0" to-layer="732" to-port="1" />
<edge from-layer="732" from-port="2" to-layer="733" to-port="0" />
<edge from-layer="733" from-port="4" to-layer="735" to-port="0" />
<edge from-layer="734" from-port="0" to-layer="735" to-port="1" />
<edge from-layer="735" from-port="2" to-layer="737" to-port="0" />
<edge from-layer="736" from-port="0" to-layer="737" to-port="1" />
<edge from-layer="737" from-port="2" to-layer="748" to-port="0" />
<edge from-layer="738" from-port="0" to-layer="739" to-port="0" />
<edge from-layer="739" from-port="1" to-layer="742" to-port="0" />
<edge from-layer="740" from-port="0" to-layer="741" to-port="0" />
<edge from-layer="741" from-port="1" to-layer="742" to-port="1" />
<edge from-layer="742" from-port="2" to-layer="744" to-port="0" />
<edge from-layer="743" from-port="0" to-layer="744" to-port="1" />
<edge from-layer="744" from-port="2" to-layer="746" to-port="0" />
<edge from-layer="745" from-port="0" to-layer="746" to-port="1" />
<edge from-layer="746" from-port="2" to-layer="747" to-port="0" />
<edge from-layer="747" from-port="1" to-layer="748" to-port="1" />
<edge from-layer="748" from-port="2" to-layer="750" to-port="0" />
<edge from-layer="749" from-port="0" to-layer="750" to-port="1" />
<edge from-layer="750" from-port="2" to-layer="751" to-port="1" />
<edge from-layer="751" from-port="2" to-layer="793" to-port="0" />
<edge from-layer="751" from-port="2" to-layer="753" to-port="0" />
<edge from-layer="752" from-port="0" to-layer="753" to-port="1" />
<edge from-layer="753" from-port="2" to-layer="755" to-port="0" />
<edge from-layer="754" from-port="0" to-layer="755" to-port="1" />
<edge from-layer="755" from-port="2" to-layer="757" to-port="0" />
<edge from-layer="756" from-port="0" to-layer="757" to-port="1" />
<edge from-layer="757" from-port="2" to-layer="768" to-port="0" />
<edge from-layer="758" from-port="0" to-layer="759" to-port="0" />
<edge from-layer="759" from-port="1" to-layer="762" to-port="0" />
<edge from-layer="760" from-port="0" to-layer="761" to-port="0" />
<edge from-layer="761" from-port="1" to-layer="762" to-port="1" />
<edge from-layer="762" from-port="2" to-layer="764" to-port="0" />
<edge from-layer="763" from-port="0" to-layer="764" to-port="1" />
<edge from-layer="764" from-port="2" to-layer="766" to-port="0" />
<edge from-layer="765" from-port="0" to-layer="766" to-port="1" />
<edge from-layer="766" from-port="2" to-layer="767" to-port="0" />
<edge from-layer="767" from-port="1" to-layer="768" to-port="1" />
<edge from-layer="768" from-port="2" to-layer="770" to-port="0" />
<edge from-layer="769" from-port="0" to-layer="770" to-port="1" />
<edge from-layer="770" from-port="2" to-layer="772" to-port="0" />
<edge from-layer="771" from-port="0" to-layer="772" to-port="1" />
<edge from-layer="772" from-port="2" to-layer="774" to-port="0" />
<edge from-layer="773" from-port="0" to-layer="774" to-port="1" />
<edge from-layer="774" from-port="2" to-layer="775" to-port="0" />
<edge from-layer="775" from-port="3" to-layer="777" to-port="0" />
<edge from-layer="776" from-port="0" to-layer="777" to-port="1" />
<edge from-layer="777" from-port="2" to-layer="779" to-port="0" />
<edge from-layer="778" from-port="0" to-layer="779" to-port="1" />
<edge from-layer="779" from-port="2" to-layer="790" to-port="0" />
<edge from-layer="780" from-port="0" to-layer="781" to-port="0" />
<edge from-layer="781" from-port="1" to-layer="784" to-port="0" />
<edge from-layer="782" from-port="0" to-layer="783" to-port="0" />
<edge from-layer="783" from-port="1" to-layer="784" to-port="1" />
<edge from-layer="784" from-port="2" to-layer="786" to-port="0" />
<edge from-layer="785" from-port="0" to-layer="786" to-port="1" />
<edge from-layer="786" from-port="2" to-layer="788" to-port="0" />
<edge from-layer="787" from-port="0" to-layer="788" to-port="1" />
<edge from-layer="788" from-port="2" to-layer="789" to-port="0" />
<edge from-layer="789" from-port="1" to-layer="790" to-port="1" />
<edge from-layer="790" from-port="2" to-layer="792" to-port="0" />
<edge from-layer="791" from-port="0" to-layer="792" to-port="1" />
<edge from-layer="792" from-port="2" to-layer="793" to-port="1" />
<edge from-layer="793" from-port="2" to-layer="795" to-port="0" />
<edge from-layer="793" from-port="2" to-layer="827" to-port="0" />
<edge from-layer="794" from-port="0" to-layer="795" to-port="1" />
<edge from-layer="795" from-port="2" to-layer="797" to-port="0" />
<edge from-layer="796" from-port="0" to-layer="797" to-port="1" />
<edge from-layer="797" from-port="2" to-layer="799" to-port="0" />
<edge from-layer="798" from-port="0" to-layer="799" to-port="1" />
<edge from-layer="799" from-port="2" to-layer="810" to-port="0" />
<edge from-layer="800" from-port="0" to-layer="801" to-port="0" />
<edge from-layer="801" from-port="1" to-layer="804" to-port="0" />
<edge from-layer="802" from-port="0" to-layer="803" to-port="0" />
<edge from-layer="803" from-port="1" to-layer="804" to-port="1" />
<edge from-layer="804" from-port="2" to-layer="806" to-port="0" />
<edge from-layer="805" from-port="0" to-layer="806" to-port="1" />
<edge from-layer="806" from-port="2" to-layer="808" to-port="0" />
<edge from-layer="807" from-port="0" to-layer="808" to-port="1" />
<edge from-layer="808" from-port="2" to-layer="809" to-port="0" />
<edge from-layer="809" from-port="1" to-layer="810" to-port="1" />
<edge from-layer="810" from-port="2" to-layer="812" to-port="0" />
<edge from-layer="811" from-port="0" to-layer="812" to-port="1" />
<edge from-layer="812" from-port="2" to-layer="813" to-port="0" />
<edge from-layer="813" from-port="1" to-layer="824" to-port="0" />
<edge from-layer="814" from-port="0" to-layer="815" to-port="0" />
<edge from-layer="815" from-port="1" to-layer="818" to-port="0" />
<edge from-layer="816" from-port="0" to-layer="817" to-port="0" />
<edge from-layer="817" from-port="1" to-layer="818" to-port="1" />
<edge from-layer="818" from-port="2" to-layer="820" to-port="0" />
<edge from-layer="819" from-port="0" to-layer="820" to-port="1" />
<edge from-layer="820" from-port="2" to-layer="822" to-port="0" />
<edge from-layer="821" from-port="0" to-layer="822" to-port="1" />
<edge from-layer="822" from-port="2" to-layer="823" to-port="0" />
<edge from-layer="823" from-port="1" to-layer="824" to-port="1" />
<edge from-layer="824" from-port="2" to-layer="826" to-port="0" />
<edge from-layer="825" from-port="0" to-layer="826" to-port="1" />
<edge from-layer="826" from-port="2" to-layer="827" to-port="1" />
<edge from-layer="827" from-port="2" to-layer="829" to-port="0" />
<edge from-layer="828" from-port="0" to-layer="829" to-port="1" />
<edge from-layer="829" from-port="2" to-layer="831" to-port="0" />
<edge from-layer="830" from-port="0" to-layer="831" to-port="1" />
<edge from-layer="831" from-port="2" to-layer="833" to-port="0" />
<edge from-layer="832" from-port="0" to-layer="833" to-port="1" />
<edge from-layer="833" from-port="2" to-layer="834" to-port="0" />
<edge from-layer="834" from-port="2" to-layer="835" to-port="0" />
</edges>
<rt_info>
<Runtime_version value="2025.2.0-19140-c01cd93e24d-releases/2025/2" />
<conversion_parameters>
<framework value="pytorch" />
<is_python_object value="True" />
</conversion_parameters>
<nncf>
<friendly_names_were_updated value="True" />
<version value="2.17.0" />
<weight_compression>
<advanced_parameters value="{'statistics_path': None, 'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100, 'prefer_data_aware_scaling': True}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}, 'lora_adapter_rank': 256, 'backend_params': {}}" />
<all_layers value="False" />
<awq value="False" />
<backup_mode value="int8_asym" />
<compression_format value="dequantize" />
<gptq value="False" />
<group_size value="128" />
<ignored_scope value="[]" />
<lora_correction value="False" />
<mode value="int4_asym" />
<ratio value="1.0" />
<scale_estimation value="False" />
<sensitivity_metric value="weight_quantization_error" />
</weight_compression>
</nncf>
<optimum>
<nncf_version value="2.17.0" />
<optimum_intel_version value="1.24.0" />
<optimum_version value="1.26.1" />
<pytorch_version value="2.7.1" />
<transformers_version value="4.52.4" />
</optimum>
</rt_info>
</net>